Papers
- Back
Contrastive Integrated Gradients: A Feature Attribution-Based Method for Explaining Whole Slide Image Classification-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Vu_2026_WACV,
  author    = {Vu, Anh Mai and Vo, Tuan L. and Bui, Ngoc Lam Quang and Le, Nam N. B. and Awasthi, Akash and Vo, Huy Q. and Nguyen, Thanh-Huy and Han, Zhu and Mohan, Chandra and Van Nguyen, Hien},
  title     = {Contrastive Integrated Gradients: A Feature Attribution-Based Method for Explaining Whole Slide Image Classification},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {1201--1210},
}
Forget Less by Learning Together through Concept Consolidation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kaushik_2026_WACV,
  author    = {Kaushik, Arjun Ramesh and Devulapally, Naresh Kumar and Lokhande, Vishnu Suresh and Ratha, Nalini and Govindaraju, Venu},
  title     = {Forget Less by Learning Together through Concept Consolidation},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {265--275},
}
MMCM: Multimodality-aware Metric using Clustering-based Modes for Probabilistic Human Motion Prediction-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Tokoro_2026_WACV,
  author    = {Tokoro, Kyotaro and Taketsugu, Hiromu and Ukita, Norimichi},
  title     = {{MMCM}: Multimodality-aware Metric using Clustering-based Modes for Probabilistic Human Motion Prediction},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {2637--2647},
}
ScoliGaitX: A Deep Multi-Modal Fusion Network for Scoliosis Assessment via Gait Video Analysis-
[pdf]
[bibtex]@InProceedings{Vishwakarma_2026_WACV,
  author    = {Vishwakarma, Kaushik and Nigam, Aditya},
  title     = {{ScoliGaitX}: A Deep Multi-Modal Fusion Network for Scoliosis Assessment via Gait Video Analysis},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {2404--2413},
}
OpenCowID: Zero-Shot Visual Identification of Dairy Cows-
[pdf]
[bibtex]@InProceedings{Prabhune_2026_WACV,
  author    = {Prabhune, Omkar and Kim, Younghyun},
  title     = {{OpenCowID}: Zero-Shot Visual Identification of Dairy Cows},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {1491--1500},
}
SpikeRain: Towards Energy-Efficient Single Image Deraining with Spiking Neural Networks-
[pdf]
[supp]
[bibtex]@InProceedings{Islam_2026_WACV,
  author    = {Islam, Md Tanvir and Alam, Inzamamul and Bakshi, Sambit and Muhammad, Khan and Del Ser, Javier and Ahn, Sangtae},
  title     = {{SpikeRain}: Towards Energy-Efficient Single Image Deraining with Spiking Neural Networks},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {1094--1105},
}
SynPlay: Large-Scale Synthetic Human Data with Real-World Diversity for Aerial-View Perception-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yim_2026_WACV,
  author    = {Yim, Jinsub and Lee, Hyungtae and Eum, Sungmin and Shen, Yi-Ting and Zhang, Yan and Kwon, Heesung and Bhattacharyya, Shuvra S.},
  title     = {{SynPlay}: Large-Scale Synthetic Human Data with Real-World Diversity for Aerial-View Perception},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {938--947},
}
OW-Rep: Open World Object Detection with Instance Representation Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lee_2026_WACV,
  author    = {Lee, Sunoh and Jeon, Minsik and Min, Jihong and Seo, Junwon},
  title     = {{OW-Rep}: Open World Object Detection with Instance Representation Learning},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {339--349},
}
Training-free Multi-view 4D Human Motion Reconstruction Virtual Reality System-
[pdf]
[supp]
[bibtex]@InProceedings{Li_2026_WACV,
  author    = {Li, Yijie and Zheng, Ce and He, Yijie and Julin, Joel and Ichikari, Ryosuke and Ogiso, Satoki and Nakae, Satoshi and Sato, Akihiro and Kurata, Takeshi and Jeni, Laszlo A.},
  title     = {Training-free Multi-view {4D} Human Motion Reconstruction Virtual Reality System},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {318--327},
}
Beyond the Encoder: Joint Encoder-Decoder Contrastive Pre-Training Improves Dense Prediction-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Quetin_2026_WACV,
  author    = {Quetin, S{\'e}bastien and Ghosh, Tapotosh and Maleki, Farhad},
  title     = {Beyond the Encoder: Joint Encoder-Decoder Contrastive Pre-Training Improves Dense Prediction},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {1000--1010},
}
Discrete Facial Encoding: A Framework for Data-driven Facial Display Discovery-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Tran_2026_WACV,
  author    = {Tran, Minh and Siniukov, Maksim and Jin, Zhangyu and Soleymani, Mohammad},
  title     = {Discrete Facial Encoding: A Framework for Data-driven Facial Display Discovery},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {2348--2358},
}
Zero-shot Hierarchical Plant Segmentation via Foundation Segmentation Models and Text-to-image Attention-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Xing_2026_WACV,
  author    = {Xing, Junhao and Miyakawa, Ryohei and Yang, Yang and Liu, Xinpeng and Shinoda, Risa and Santo, Hiroaki and Toda, Yosuke and Okura, Fumio},
  title     = {Zero-shot Hierarchical Plant Segmentation via Foundation Segmentation Models and Text-to-image Attention},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {2510--2519},
}
VISTA: A Vision and Intent-Aware Social Attention Framework for Multi-Agent Trajectory Prediction-
[pdf]
[supp]
[bibtex]@InProceedings{Da_Silva_Martins_2026_WACV,
  author    = {Da Silva Martins, Stephane and Aldea, Emanuel and Le H{\'e}garat-Mascle, Sylvie},
  title     = {{VISTA}: A Vision and Intent-Aware Social Attention Framework for Multi-Agent Trajectory Prediction},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {287--296},
}
WWE-UIE: A Wavelet & White Balance Efficient Network for Underwater Image Enhancement-
[pdf]
[arXiv]
[bibtex]@InProceedings{Cheng_2026_WACV,
  author    = {Cheng, Ching-Heng and Lee, Jen-Wei and Lee, Chia-Ming and Hsu, Chih-Chung},
  title     = {{WWE-UIE}: A Wavelet \& White Balance Efficient Network for Underwater Image Enhancement},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {2135--2145},
}
DenseBEV: Transforming BEV Grid Cells into 3D Objects-
[pdf]
[supp]
[bibtex]@InProceedings{Dahling_2026_WACV,
  author    = {D{\"a}hling, Marius and Krebs, Sebastian and Z{\"o}llner, J. Marius},
  title     = {{DenseBEV}: Transforming {BEV} Grid Cells into {3D} Objects},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {2370--2379},
}
Enhanced Back-Projection of Vision Features for 3D Symmetry Detection-
[pdf]
[supp]
[bibtex]@InProceedings{Aguirre_2026_WACV,
  author    = {Aguirre, Isaac and Sipiran, Ivan},
  title     = {Enhanced Back-Projection of Vision Features for {3D} Symmetry Detection},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {66--76},
}
Tables Guide Vision: Learning to See the Heart through Tabular Data-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Hasny_2026_WACV,
  author    = {Hasny, Marta and Di Folco, Maxime and Bressem, Keno and Schnabel, Julia},
  title     = {Tables Guide Vision: Learning to See the Heart through Tabular Data},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {1716--1725},
}
RapidMV: Leveraging Spatio-Angular Latent Space for Efficient and Consistent Text-to-Multi-View Synthesis-
[pdf]
[supp]
[bibtex]@InProceedings{Kim_2026_WACV,
  author    = {Kim, Seungwook and Shi, Yichun and Li, Kejie and Cho, Minsu and Wang, Peng},
  title     = {{RapidMV}: Leveraging Spatio-Angular Latent Space for Efficient and Consistent Text-to-Multi-View Synthesis},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {1674--1684},
}
BrandFusion: Aligning Image Generation with Brand Styles-
[pdf]
[supp]
[bibtex]@InProceedings{Gupta_2026_WACV,
  author    = {Gupta, Parul and Khurana, Varun and Singla, Yaman Kumar and Krishnamurthy, Balaji and Dhall, Abhinav},
  title     = {{BrandFusion}: Aligning Image Generation with Brand Styles},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {2316--2326},
}
Reverse Personalization-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kung_2026_WACV,
  author    = {Kung, Han-Wei and Varanka, Tuomas and Sebe, Nicu},
  title     = {Reverse Personalization},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {988--999},
}
SmokeBench: Evaluating Multimodal Large Language Models for Wildfire Smoke Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Qi_2026_WACV,
  author    = {Qi, Tianye and Li, Weihao and Barnes, Nick},
  title     = {{SmokeBench}: Evaluating Multimodal Large Language Models for Wildfire Smoke Detection},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {1043--1053},
}
Temporal Object Captioning for Street Scene Videos from LiDAR Tracks-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Gopinathan_2026_WACV,
  author    = {Gopinathan, Vignesh and Zimmermann, Urs and Arnold, Michael and Rottmann, Matthias},
  title     = {Temporal Object Captioning for Street Scene Videos from {LiDAR} Tracks},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {2848--2857},
}
MDUNet: Multimodal Decoding UNet for Passive Occluder-Aided Non-line-of-sight 3D Imaging-
[pdf]
[supp]
[bibtex]@InProceedings{Raji_2026_WACV,
  author    = {Raji, Fadlullah and Murray-Bruce, John},
  title     = {{MDUNet}: Multimodal Decoding {UNet} for Passive Occluder-Aided Non-line-of-sight {3D} Imaging},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {461--471},
}
FALCONEye: Finding Answers and Localizing Content in ONE-hour-long videos with multi-modal LLMs-
[pdf]
[supp]
[bibtex]@InProceedings{Plou_2026_WACV,
  author    = {Plou, Carlos and Borja, Cesar and Martinez-Cantin, Ruben and Murillo, Ana C.},
  title     = {{FALCONEye}: Finding Answers and Localizing Content in {ONE-hour-long} videos with multi-modal {LLMs}},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {1334--1344},
}
Enabling High-Quality In-the-Wild Imaging from Severely Aberrated Metalens Bursts-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Mandal_2026_WACV,
  author    = {Mandal, Debabrata and Peng, Zhihan and Wang, Yujie and Chakravarthula, Praneeth},
  title     = {Enabling High-Quality In-the-Wild Imaging from Severely Aberrated Metalens Bursts},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {849--859},
}
From Bands to Depth: Understanding Bathymetry Decisions on Sentinel-2-
[pdf]
[arXiv]
[bibtex]@InProceedings{Chowdhury_2026_WACV,
  author    = {Chowdhury, Satyaki Roy and Radhakrishnan, Aswathnarayan and Subramoni, Hari},
  title     = {From Bands to Depth: Understanding Bathymetry Decisions on {Sentinel-2}},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {2063--2072},
}
Conjuring Positive Pairs for Efficient Unification of Representation Learning and Image Synthesis-
[pdf]
[supp]
[bibtex]@InProceedings{Estepa_2026_WACV,
  author    = {Estepa, Imanol G. and Rodr{\'\i}guez-de-Vera, Jes{\'u}s M. and Saras{\'u}a, Ignacio and Nagarajan, Bhalaji and Radeva, Petia},
  title     = {Conjuring Positive Pairs for Efficient Unification of Representation Learning and Image Synthesis},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {751--761},
}
Root Completion from Intraoral Scans of Tooth Crowns using Diffusion with Patch Perturbation-
[pdf]
[bibtex]@InProceedings{Jang_2026_WACV,
  author    = {Jang, Yohan and Song, In-Seok and Baek, Seung Jun},
  title     = {Root Completion from Intraoral Scans of Tooth Crowns using Diffusion with Patch Perturbation},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {483--492},
}
FlowMorph: Revealing an Optimizable Flow Latent Space for Controlled Image Morphing-
[pdf]
[supp]
[bibtex]@InProceedings{Zheng_2026_WACV,
  author    = {Zheng, Yan and Yang, Yi and Guo, Lanqing and Wang, Zhangyang},
  title     = {{FlowMorph}: Revealing an Optimizable Flow Latent Space for Controlled Image Morphing},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {2455--2464},
}
Boosting Medical Vision-Language Pretraining via Momentum Self-Distillation under Limited Computing Resources-
[pdf]
[arXiv]
[bibtex]@InProceedings{Pham_2026_WACV,
  author    = {Pham, Phuc and Pham, Nhu and Ly, Ngoc Quoc},
  title     = {Boosting Medical Vision-Language Pretraining via Momentum Self-Distillation under Limited Computing Resources},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {860--868},
}
MR-Pruner: Training-free Multi-resolution Visual Token Pruning for Multi-modal Large Language Models-
[pdf]
[bibtex]@InProceedings{Han_2026_WACV,
  author    = {Han, Seunghoon and Lee, Hyewon and Park, Soyoung and Lee, Jong-Ryul and Lim, Sungsu},
  title     = {{MR-Pruner}: Training-free Multi-resolution Visual Token Pruning for Multi-modal Large Language Models},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {1084--1093},
}
Descrip3D: Enhancing Large Language Model-based 3D Scene Understanding with Object-Level Text Descriptions-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Xue_2026_WACV,
  author    = {Xue, Jintang and Zhao, Ganning and Yao, Jie-En and Chen, Hong-En and Hu, Yue and Chen, Meida and You, Suya and Kuo, C.-C. Jay},
  title     = {{Descrip3D}: Enhancing Large Language Model-based {3D} Scene Understanding with Object-Level Text Descriptions},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {1746--1756},
}
1LoRA: Summation Compression for Very Low-Rank Adaptation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Quercia_2026_WACV,
  author    = {Quercia, Alessio and Cao, Zhuo and Bangun, Arya and Paul, Richard D. and Morrison, Abigail and Assent, Ira and Scharr, Hanno},
  title     = {{1LoRA}: Summation Compression for Very Low-Rank Adaptation},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {2253--2262},
}
Conditional Text-to-Image Generation with Reference Guidance-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kim_2026_WACV_ReferenceGuidance,
  author    = {Kim, Taewook and Wang, Ze and Yang, Zhengyuan and Wang, Jiang and Wang, Lijuan and Liu, Zicheng and Qiu, Qiang},
  title     = {Conditional Text-to-Image Generation with Reference Guidance},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {2879--2889},
}
Deepfake Detection that Generalizes Across Benchmarks-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yermakov_2026_WACV,
  author    = {Yermakov, Andrii and Cech, Jan and Matas, Jiri and Fritz, Mario},
  title     = {Deepfake Detection that Generalizes Across Benchmarks},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {773--783},
}
CycleSL: Server-Client Cyclical Update Driven Scalable Split Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2026_WACV,
  author    = {Wang, Mengdi and Bozkir, Efe and Kasneci, Enkelejda},
  title     = {{CycleSL}: Server-Client Cyclical Update Driven Scalable Split Learning},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {1841--1851},
}
From SAM to DINOv2: Towards Distilling Foundation Models to Lightweight Baselines for Generalized Polyp Segmentation-
[pdf]
[arXiv]
[bibtex]@InProceedings{Agnihotri_2026_WACV,
  author    = {Agnihotri, Shivanshu and Majhi, Snehashis and Nayak, Deepak Ranjan and Jha, Debesh},
  title     = {From {SAM} to {DINOv2}: Towards Distilling Foundation Models to Lightweight Baselines for Generalized Polyp Segmentation},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {1757--1766},
}
Graph-Based Spectral Attention with Multi-Spectral Images for Illuminant Estimation-
[pdf]
[supp]
[bibtex]@InProceedings{Kang_2026_WACV,
  author    = {Kang, Dong-Hoon and Baek, Seung-Yeop and Kim, Jong-Ok},
  title     = {Graph-Based Spectral Attention with Multi-Spectral Images for Illuminant Estimation},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {2912--2922},
}
Knowledge to Sight: Reasoning over Visual Attributes via Knowledge Decomposition for Abnormality Grounding-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2026_WACV_KnowledgeToSight,
  author    = {Li, Jun and Liu, Che and Bai, Wenjia and Liu, Mingxuan and Arcucci, Rossella and Bercea, Cosmin I. and Schnabel, Julia},
  title     = {Knowledge to Sight: Reasoning over Visual Attributes via Knowledge Decomposition for Abnormality Grounding},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {2359--2369},
}
4D-Animal: Freely Reconstructing Animatable 3D Animals from Videos-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhong_2026_WACV,
  author    = {Zhong, Shanshan and Peng, Jiawei and Zheng, Zehan and Huang, Zhongzhan and Ma, Wufei and Zhang, Guofeng and Liu, Qihao and Yuille, Alan and Chen, Jieneng},
  title     = {{4D-Animal}: Freely Reconstructing Animatable {3D} Animals from Videos},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {602--612},
}
PVeRA: Probabilistic Vector-Based Random Matrix Adaptation-
[pdf]
[supp]
[bibtex]@InProceedings{Fillioux_2026_WACV,
  author    = {Fillioux, Leo and Ferrante, Enzo and Courn{\`e}de, Paul-Henry and Vakalopoulou, Maria and Christodoulidis, Stergios},
  title     = {{PVeRA}: Probabilistic Vector-Based Random Matrix Adaptation},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {2465--2474},
}
Improved Wildfire Spread Prediction with Time-Series Data and the WSTS+ Benchmark-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lahrichi_2026_WACV,
  author    = {Lahrichi, Saad and Bova, Jake and Johnson, Jesse and Malof, Jordan},
  title     = {Improved Wildfire Spread Prediction with Time-Series Data and the {WSTS+} Benchmark},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {2890--2900},
}
CADE: Continual Weakly-supervised Video Anomaly Detection with Ensembles-
[pdf]
[arXiv]
[bibtex]@InProceedings{Hashimoto_2026_WACV,
  author    = {Hashimoto, Satoshi and Konishi, Tatsuya and Kaichi, Tomoya and Matsumoto, Kazunori and Kurokawa, Mori},
  title     = {{CADE}: Continual Weakly-supervised Video Anomaly Detection with Ensembles},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {708--717},
}
DOODLE: Diffusion-based Out-of-Distribution Learning for Open-set LiDAR Semantic Segmentation-
[pdf]
[supp]
[bibtex]@InProceedings{Oh_2026_WACV,
  author    = {Oh, Changgyoon and Kim, Hyeonseong and We, Daehyun and Jeong, Jongoh and Chae, Yujeong and Yoon, Kuk-Jin},
  title     = {{DOODLE}: Diffusion-based Out-of-Distribution Learning for Open-set {LiDAR} Semantic Segmentation},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {2273--2283},
}
RobustFormer: Noise-Robust Pre-training for Images and Videos-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Bastola_2026_WACV,
  author    = {Bastola, Ashish and Luitel, Nishant and Wang, Hao and Paudel, Danda Pani and Poudel, Roshni and Razi, Abolfazl},
  title     = {{RobustFormer}: Noise-Robust Pre-training for Images and Videos},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {2284--2294},
}
Reviving Unsupervised Optical Flow: Concept Reevaluation, Multi-Scale Advances and Full Open-Source Release-
[pdf]
[supp]
[bibtex]@InProceedings{Jahedi_2026_WACV,
  author    = {Jahedi, Azin and Rivinius, Marc and Senn, Noah Berenguel and Bruhn, Andres},
  title     = {Reviving Unsupervised Optical Flow: Concept Reevaluation, Multi-Scale Advances and Full Open-Source Release},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {1533--1542},
}
STARS: Self-supervised Tuning for 3D Action Recognition in Skeleton Sequences-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Mehraban_2026_WACV,
  author    = {Mehraban, Soroush and Rajabi, Mohammad Javad and Iaboni, Andrea and Taati, Babak},
  title     = {{STARS}: Self-supervised Tuning for {3D} Action Recognition in Skeleton Sequences},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {2858--2868},
}
ConsensusXAI: A Framework to Examine Class-wise Agreement in Medical Imaging-
[pdf]
[supp]
[bibtex]@InProceedings{Haider_2026_WACV,
  author    = {Haider, Abbas and Wright, David and Hogg, Ruth and Wang, Hui and Peto, Tunde and Gault, Richard},
  title     = {{ConsensusXAI}: A Framework to Examine Class-wise Agreement in Medical Imaging},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {2661--2669},
}
Anatomy-VLM: A Fine-grained Vision-Language Model for Medical Interpretation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Gu_2026_WACV,
  author    = {Gu, Difei and Gao, Yunhe and Zhou, Mu and Metaxas, Dimitris},
  title     = {{Anatomy-VLM}: A Fine-grained Vision-Language Model for Medical Interpretation},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {2838--2847},
}
milliMamba: Specular-Aware Human Pose Estimation via Dual mmWave Radar with Multi-Frame Mamba Fusion-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kini_2026_WACV,
  author    = {Kini, Niraj Prakash and Tsai, Shiau-Rung and Lin, Guan-Hsun and Peng, Wen-Hsiao and Ma, Ching-Wen and Hwang, Jenq-Neng},
  title     = {{milliMamba}: Specular-Aware Human Pose Estimation via Dual {mmWave} Radar with Multi-Frame {Mamba} Fusion},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {1481--1490},
}
MIX-based Foreground and Background Patch Augmentation Guided by Physics and Material Properties for X-ray Detection-
[pdf]
[bibtex]@InProceedings{Liu_2026_WACV,
  author    = {Liu, Xintong and Chang, Dongliang and Tong, Yujun and Ma, Zhanyu},
  title     = {{MIX-based} Foreground and Background Patch Augmentation Guided by Physics and Material Properties for {X-ray} Detection},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {977--987},
}
SGPMIL: Sparse Gaussian Process Multiple Instance Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lolos_2026_WACV,
  author    = {Lolos, Andreas and Christodoulidis, Stergios and Moustakas, Aris L. and Dolz, Jose and Vakalopoulou, Maria},
  title     = {{SGPMIL}: Sparse {Gaussian} Process Multiple Instance Learning},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {503--513},
}
Beyond Real Weights: Hypercomplex Representations for Stable Quantization-
[pdf]
[arXiv]
[bibtex]@InProceedings{Ibn_Ahad_2026_WACV,
  author    = {Ibn Ahad, Jawad and Rahman, Maisha and Biswas, Amrijit and Kabir, Muhammad Rafsan and Krambroeckers, Robin and Momen, Sifat and Mohammed, Nabeel and Rahman, Shafin},
  title     = {Beyond Real Weights: Hypercomplex Representations for Stable Quantization},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {1180--1190},
}
Uncertainty-Aware Subset Selection for Robust Visual Explainability under Distribution Shifts-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Gupta_2026_WACV_SubsetSelection,
  author    = {Gupta, Madhav and Prasad, Vishak and Ramakrishnan, Ganesh},
  title     = {Uncertainty-Aware Subset Selection for Robust Visual Explainability under Distribution Shifts},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {1643--1652},
}
Joint Modeling of Corruption-Driven and Information-Limited Uncertainty for Robust 3D Gaussian Splatting-
[pdf]
[bibtex]@InProceedings{Hui_2026_WACV,
  author    = {Hui, Zeji and Gostar, Amirali Khodadadian and Chuah, WeiQin and Bab-Hadiashar, Alireza and Tennakoon, Ruwan},
  title     = {Joint Modeling of Corruption-Driven and Information-Limited Uncertainty for Robust {3D} {Gaussian} Splatting},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {688--697},
}
iMotion-LLM: Instruction-Conditioned Trajectory Generation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Felemban_2026_WACV,
  author    = {Felemban, Abdulwahab and Hroub, Nussair and Ding, Jian and Abdelrahman, Eslam and Shen, Xiaoqian and Mohamed, Abduallah and Elhoseiny, Mohamed},
  title     = {{iMotion-LLM}: Instruction-Conditioned Trajectory Generation},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {2710--2720},
}
Inpaint360GS: Efficient Object-Aware 3D Inpainting via Gaussian Splatting for 360° Scenes-
[pdf]
[supp]
[bibtex]@InProceedings{Wang_2026_WACV_Inpaint360GS,
  author    = {Wang, Shaoxiang and Zhang, Shihong and Millerdurai, Christen and Westermann, R{\"u}diger and Stricker, Didier and Pagani, Alain},
  title     = {{Inpaint360GS}: Efficient Object-Aware {3D} Inpainting via {Gaussian} Splatting for {$360^{\circ}$} Scenes},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {117--127},
}
Model-free Domain Adaptation for Concealed Multimodal Large-Language Models-
[pdf]
[supp]
[bibtex]@InProceedings{Mitsuzumi_2026_WACV,
  author    = {Mitsuzumi, Yu and Kimura, Akisato and Kashima, Hisashi},
  title     = {Model-free Domain Adaptation for Concealed Multimodal Large-Language Models},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {1231--1241},
}
AD2: Analysis and Detection of Adversarial Threats in Visual Perception for End-to-End Autonomous Driving Systems-
[pdf]
[supp]
[bibtex]@InProceedings{Sahu_2026_WACV,
  author    = {Sahu, Ishan and Hazra, Somnath and Aditya, Somak and Dey, Soumyajit},
  title     = {{AD2}: Analysis and Detection of Adversarial Threats in Visual Perception for End-to-End Autonomous Driving Systems},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {1695--1704},
}
BiPO: Bidirectional Partial Occlusion Network for Text-to-Motion Synthesis-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Hong_2026_WACV,
  author    = {Hong, Seong-Eun and Lim, SooBin and Hwang, JuYeong and Chang, Minwook and Kang, HyeongYeop},
  title     = {{BiPO}: Bidirectional Partial Occlusion Network for Text-to-Motion Synthesis},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {32--42},
}
Color Bind: Exploring Color Perception in Text-to-Image Models-
[pdf]
[supp]
[bibtex]@InProceedings{Shomer-Chai_2026_WACV,
  author    = {Shomer-Chai, Shay and Peng, Wenxuan and Hariharan, Bharath and Averbuch-Elor, Hadar},
  title     = {Color Bind: Exploring Color Perception in Text-to-Image Models},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {1916--1925},
}
From Lightweight CNNs to SpikeNets: Benchmarking Accuracy-Energy Tradeoffs with Pruned Spiking SqueezeNet-
[pdf]
[arXiv]
[bibtex]@InProceedings{Bin_Kabir_2026_WACV,
  author    = {Bin Kabir, Radib and Dipto, Tawsif Tashwar and Ahamed, Mehedi and Ahmed, Sabbir and Kabir, Md Hasanul},
  title     = {From Lightweight {CNNs} to {SpikeNets}: Benchmarking Accuracy-Energy Tradeoffs with Pruned Spiking {SqueezeNet}},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {1137--1146},
}
Enhancing Object Detection Training via Joint Image-Annotation Generation-
[pdf]
[supp]
[bibtex]@InProceedings{Uziel_2026_WACV,
  author    = {Uziel, Roy and Bialer, Oded},
  title     = {Enhancing Object Detection Training via Joint Image-Annotation Generation},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {1736--1745},
}
DreamAnywhere: Object-Centric Panoramic 3D Scene Generation-
[pdf]
[supp]
[bibtex]@InProceedings{Dominici_2026_WACV,
  author    = {Dominici, Edoardo A. and Hladk{\'y}, Jozef and Verhoeven, Floor and Radl, Lukas and Deixelberger, Thomas and Ainetter, Stefan and Drescher, Philipp and Hauswiesner, Stefan and Coomans, Arno and Nazzaro, Giacomo and Vardis, Konstantinos and Steinberger, Markus},
  title     = {{DreamAnywhere}: Object-Centric Panoramic {3D} Scene Generation},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {1--11},
}
DiT-VTON: Diffusion Transformer Framework for Unified Multi-Category Virtual Try-On and Virtual Try-All with Integrated Image Editing-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2026_WACV_DiTVTON,
  author    = {Li, Qi and Qiu, Shuwen and Koo, Kee Kiat and Han, Julien and Bouyarmane, Karim},
  title     = {{DiT-VTON}: Diffusion Transformer Framework for Unified Multi-Category Virtual Try-On and Virtual Try-All with Integrated Image Editing},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {202--211},
}
ObjectMeshDeform : Towards Recovering Precise 3D Geometry of Real Objects via Image-guided Mesh Deformation of 3D Generative Priors-
[pdf]
[supp]
[bibtex]@InProceedings{Katageri_2026_WACV, author = {Katageri, Siddharth and Sinha, Sanjana and Ghosh, Sourav and Maity, Soumyadip and Bhowmick, Brojeshwar}, title = {ObjectMeshDeform : Towards Recovering Precise 3D Geometry of Real Objects via Image-guided Mesh Deformation of 3D Generative Priors}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {2585-2595} }
Cluster-based Pseudo-labeling for Semi-Supervised LiDAR Semantic Segmentation-
[pdf]
[supp]
[bibtex]@InProceedings{Guo_2026_WACV, author = {Guo, Qingju and Li, Shuang and Geng, Jing and Xie, Binhui and Shan, Jiawei and Li, Wei}, title = {Cluster-based Pseudo-labeling for Semi-Supervised LiDAR Semantic Segmentation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {623-634} }
Memory-Augmented Representation for Efficient Event-based Visuomotor Policy Learning with Adaptive Perception and Control-
[pdf]
[bibtex]@InProceedings{Kamal_2026_WACV, author = {Kamal, Uday and Mukhopadhyay, Saibal}, title = {Memory-Augmented Representation for Efficient Event-based Visuomotor Policy Learning with Adaptive Perception and Control}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {2596-2605} }
Accelerated Dose Generation in Gamma Knife Radiosurgery Using a Wavelet Diffusion Model for Sparse Representation-
[pdf]
[supp]
[bibtex]@InProceedings{Lee_2026_WACV, author = {Lee, Sangyoon and Mishra, Shubuendu and Watanabe, Yoichi}, title = {Accelerated Dose Generation in Gamma Knife Radiosurgery Using a Wavelet Diffusion Model for Sparse Representation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {917-926} }
Can We Challenge Open-Vocabulary Object Detectors with Generated Content in Street Scenes?-
[pdf]
[supp]
[bibtex]@InProceedings{Mutze_2026_WACV, author = {M{\"u}tze, Annika and Ilyas, Sadia and D{\"o}rpelkus, Christian and Rottmann, Matthias}, title = {Can We Challenge Open-Vocabulary Object Detectors with Generated Content in Street Scenes?}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {740-750} }
Autocorrelation-based Fiducial Markers for Traceability-
[pdf]
[supp]
[bibtex]@InProceedings{Bencheikh_2026_WACV, author = {Bencheikh, Ismail and Dunitz, Max and d'Autume, Marie and Meinhardt-Llopis, Enric and Pic, Marc and Facciolo, Gabriele and Mus{\'e}, Pablo}, title = {Autocorrelation-based Fiducial Markers for Traceability}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1345-1354} }
AutoSew: A Geometric Approach to Stitching Prediction with Graph Neural Networks-
[pdf]
[supp]
[bibtex]@InProceedings{Rios-Navarro_2026_WACV, author = {R{\'\i}os-Navarro, Pablo and Garces, Elena and Lopez-Moreno, Jorge}, title = {AutoSew: A Geometric Approach to Stitching Prediction with Graph Neural Networks}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1374-1383} }
BoxSplitGen: A Generative Model for 3D Part Bounding Boxes in Varying Granularity-
[pdf]
[supp]
[bibtex]@InProceedings{Koo_2026_WACV, author = {Koo, Juil and Lin, Wei-Tung and Park, Chanho and Park, Chanhyeok and Sung, Minhyuk}, title = {BoxSplitGen: A Generative Model for 3D Part Bounding Boxes in Varying Granularity}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1777-1787} }
GeoHSAF: Geometric Hippocampus Shape Analysis Framework for Longitudinal Alzheimer's Disease Classification-
[pdf]
[supp]
[bibtex]@InProceedings{Olaoluwa_2026_WACV, author = {Olaoluwa, Mubarak and Loukil, Heni and Sbei, Arafet and Drira, Hassen}, title = {GeoHSAF: Geometric Hippocampus Shape Analysis Framework for Longitudinal Alzheimer's Disease Classification}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {2156-2167} }
SilverLining: Data-First Mitigation of Spatial and Spectral Shortcuts Without Introducing New Confounders-
[pdf]
[supp]
[bibtex]@InProceedings{Unnikrishnan_2026_WACV, author = {Unnikrishnan, Balagopal and Brudno, Michael and McIntosh, Chris}, title = {SilverLining: Data-First Mitigation of Spatial and Spectral Shortcuts Without Introducing New Confounders}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1294-1303} }
Real-Time Tracking of Flexible Markers in Low-Contrast Fluoroscopy Using a Deep Neural Network Trained Solely on Synthetic Data-
[pdf]
[supp]
[bibtex]@InProceedings{Uchiyama_2026_WACV, author = {Uchiyama, Tomoki and Sakata, Yukinobu and Hirai, Ryusuke and Ishikawa, Hitoshi and Mori, Shinichiro}, title = {Real-Time Tracking of Flexible Markers in Low-Contrast Fluoroscopy Using a Deep Neural Network Trained Solely on Synthetic Data}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {2670-2679} }
Ordinal-Aware Multimodal Engagement Recognition for Collaborative Learning-
[pdf]
[supp]
[bibtex]@InProceedings{Tran_2026_WACV, author = {Tran, Nha and Ly, Dat and Ta, Phi and Nguyen, Hung and Nguyen, Hien D.}, title = {Ordinal-Aware Multimodal Engagement Recognition for Collaborative Learning}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {2424-2433} }
TA-Prompting: Enhancing Video Large Language Models for Dense Video Captioning via Temporal Anchors-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Cheng_2026_WACV, author = {Cheng, Wei-Yuan and Chang, Kai-Po and Huang, Chi-Pin and Yang, Fu-En and Wang, Yu-Chiang Frank}, title = {TA-Prompting: Enhancing Video Large Language Models for Dense Video Captioning via Temporal Anchors}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {225-235} }
Harnessing Object Grounding for Time-Sensitive Video Understanding-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wu_2026_WACV, author = {Wu, Tz-Ying and Sridhar, Sharath Nittur and Tripathi, Subarna}, title = {Harnessing Object Grounding for Time-Sensitive Video Understanding}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {2475-2484} }
OracleGS: Grounding Generative Priors for Sparse-View Gaussian Splatting-
[pdf]
[supp]
[bibtex]@InProceedings{Topaloglu_2026_WACV, author = {Topalo{\u{g}}lu, Atakan and Li, Kunyi and Niemeyer, Michael and Navab, Nassir and Tekalp, A. Murat and Tombari, Federico}, title = {OracleGS: Grounding Generative Priors for Sparse-View Gaussian Splatting}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {77-87} }
DICE: Discrete Inversion Enabling Controllable Editing for Masked Generative Models-
[pdf]
[supp]
[bibtex]@InProceedings{He_2026_WACV, author = {He, Xiaoxiao and Dao, Quan and Han, Ligong and Wen, Song and Bai, Minhao and Liu, Di and Zhang, Han and Juefei-Xu, Felix and Tan, Chaowei and Liu, Bo and Min, Martin Renqiang and Li, Kang and Ahmed, Faez and Srivastava, Akash and Li, Hongdong and Huang, Junzhou and Metaxas, Dimitris N.}, title = {DICE: Discrete Inversion Enabling Controllable Editing for Masked Generative Models}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {762-772} }
Human Pose Aggregation for Multi-View Temporal Video Alignment-
[pdf]
[bibtex]@InProceedings{Delattre_2026_WACV, author = {Delattre, Fabien and Huang, Tsung-Wei and Su, Guan-Ming and Learned-Miller, Erik}, title = {Human Pose Aggregation for Multi-View Temporal Video Alignment}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {635-646} }
How to Design and Train Your Implicit Neural Representation for Video Compression-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Gwilliam_2026_WACV, author = {Gwilliam, Matthew and Zhang, Roy and Padmanabhan, Namitha and Du, Hongyang and Shrivastava, Abhinav}, title = {How to Design and Train Your Implicit Neural Representation for Video Compression}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {729-739} }
CraftSVG: Multi-Object Text-to-SVG Synthesis via Layout Guided Diffusion-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Banerjee_2026_WACV, author = {Banerjee, Ayan and Mathur, Nityanand and Llados, Josep and Pal, Umapada and Dutta, Anjan}, title = {CraftSVG: Multi-Object Text-to-SVG Synthesis via Layout Guided Diffusion}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {2564-2574} }
Trajectory Tactics: When Transformers Learn Exploration to Generate Online Signature-
[pdf]
[bibtex]@InProceedings{Pandey_2026_WACV, author = {Pandey, Anurag and Nigam, Aditya and Bhavsar, Arnav and Sharma, Ashutosh and Verma, Basu and Acharya, Divya and Amir, Mohd}, title = {Trajectory Tactics: When Transformers Learn Exploration to Generate Online Signature}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {2306-2315} }
MageBench: Bridging Large Multimodal Models to Agents-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhang_2026_WACV, author = {Zhang, Miaosen and Dai, Qi and Yang, Yifan and Bao, Jianmin and Chen, Dongdong and Qiu, Kai and Luo, Chong and Geng, Xin and Guo, Baining}, title = {MageBench: Bridging Large Multimodal Models to Agents}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1415-1427} }
NerVast: Compression-Efficient Scaling of Implicit Neural Video Representations via Scene-based Parameter-sharing-
[pdf]
[supp]
[bibtex]@InProceedings{Lee_2026_WACV, author = {Lee, Yunheon and Ye, Juncheol and Kim, Jaehong and Han, Dongsu}, title = {NerVast: Compression-Efficient Scaling of Implicit Neural Video Representations via Scene-based Parameter-sharing}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {2616-2625} }
CAMP-VQA: Caption-Embedded Multimodal Perception for No-Reference Quality Assessment of Compressed Video-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2026_WACV, author = {Wang, Xinyi and Katsenou, Angeliki and Shen, Junxiao and Bull, David}, title = {CAMP-VQA: Caption-Embedded Multimodal Perception for No-Reference Quality Assessment of Compressed Video}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {2042-2051} }
HyperPose: Hyper-pose Embeddings for 3D-Aware Generative Models with Self-Supervised Disentangling of Pose and Scene-
[pdf]
[supp]
[bibtex]@InProceedings{Kim_2026_WACV, author = {Kim, Mijeong and Kim, Namgi and Han, Bohyung}, title = {HyperPose: Hyper-pose Embeddings for 3D-Aware Generative Models with Self-Supervised Disentangling of Pose and Scene}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1011-1021} }
Mitigating Backdoor Attacks via Trigger Reconstruction and Model Hardening-
[pdf]
[supp]
[bibtex]@InProceedings{Tao_2026_WACV, author = {Tao, Guanhong and Cheng, Siyuan and Shen, Guangyu and Liu, Yingqi and An, Shengwei and Zhang, Zhuo and Wang, Zhenting and Guo, Hanxi and Zhang, Xiangyu}, title = {Mitigating Backdoor Attacks via Trigger Reconstruction and Model Hardening}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {580-590} }
Visibility guided Self-Supervised Occlusion-Resilient Human Pose Estimation-
[pdf]
[supp]
[bibtex]@InProceedings{Dutta_2026_WACV, author = {Dutta, Arindam and Bose, Sarosij and Kundu, Rohit and Ta, Calvin-Khang and Bachu, Saketh and Karydis, Konstantinos and Roy-Chowdhury, Amit K.}, title = {Visibility guided Self-Supervised Occlusion-Resilient Human Pose Estimation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1054-1063} }
Feature-Disentangling RGB-NIR Fusion Network for Remote Driver Physiological Measurement-
[pdf]
[supp]
[bibtex]@InProceedings{Bouraffa_2026_WACV, author = {Bouraffa, Tayssir and Wang, Ziyuan and Str{\"u}ber, Daniel}, title = {Feature-Disentangling RGB-NIR Fusion Network for Remote Driver Physiological Measurement}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {657-666} }
CommonForms: A Large, Diverse Dataset for Form Field Detection-
[pdf]
[arXiv]
[bibtex]@InProceedings{Barrow_2026_WACV, author = {Barrow, Joe}, title = {CommonForms: A Large, Diverse Dataset for Form Field Detection}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1170-1179} }
OpenLVLM-MIA: A Controlled Benchmark Revealing the Limits of Membership Inference Attacks on Large Vision-Language Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Miyamoto_2026_WACV, author = {Miyamoto, Ryoto and Fan, Xin and Kido, Fuyuko and Matsumoto, Tsuneo and Yamana, Hayato}, title = {OpenLVLM-MIA: A Controlled Benchmark Revealing the Limits of Membership Inference Attacks on Large Vision-Language Models}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {2680-2689} }
QCFace: Image Quality Control for boosting Face Representation & Recognition-
[pdf]
[supp]
[bibtex]@InProceedings{Doan-Ngo_2026_WACV, author = {Doan-Ngo, Duc-Phuong and Diep, Thanh-Dang and Nguyen-Duc, Thanh and Le, Thanh-Sach and Thoai, Nam}, title = {QCFace: Image Quality Control for boosting Face Representation \& Recognition}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1501-1511} }
False Alarm Rectification for Early Smoke Segmentation-
[pdf]
[bibtex]@InProceedings{Zhao_2026_WACV, author = {Zhao, Hongjin and Li, Weihao and Ji, Ge-Peng and Barnes, Nick}, title = {False Alarm Rectification for Early Smoke Segmentation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1969-1978} }
DMAT: An End-to-End Framework for Joint Atmospheric Turbulence Mitigation and Object Detection-
[pdf]
[arXiv]
[bibtex]@InProceedings{Hill_2026_WACV, author = {Hill, Paul and Liu, Zhiming and Achim, Alin and Bull, David and Anantrasirichai, Nantheera}, title = {DMAT: An End-to-End Framework for Joint Atmospheric Turbulence Mitigation and Object Detection}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {2690-2699} }
ViGG: Robust RGB-D Point Cloud Registration using Visual-Geometric Mutual Guidance-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chen_2026_WACV, author = {Chen, Congjia and Yan, Shen and Qu, Yufu}, title = {ViGG: Robust RGB-D Point Cloud Registration using Visual-Geometric Mutual Guidance}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {816-826} }
Revisiting Layer Normalization for Point Cloud Test Time Adaptation-
[pdf]
[supp]
[bibtex]@InProceedings{Yazdanpanah_2026_WACV, author = {Yazdanpanah, Moslem and Bahri, Ali and Noori, Mehrdad and Dastani, Sahar and Barbeau, Samuel and Osowiechi, David and Hakim, Gustavo Adolfo Vargas and Ben Ayed, Ismail and Desrosiers, Christian}, title = {Revisiting Layer Normalization for Point Cloud Test Time Adaptation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {537-546} }
LooC: Effective Low-Dimensional Codebook for Compositional Vector Quantization-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2026_WACV, author = {Li, Jie and Wong, Kwan-Yee K. and Han, Kai}, title = {LooC: Effective Low-Dimensional Codebook for Compositional Vector Quantization}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {160-170} }
A-V Representation Learning via Audio Shift Prediction for Multimodal Deepfake Detection and Temporal Localization-
[pdf]
[supp]
[bibtex]@InProceedings{Anshul_2026_WACV, author = {Anshul, Ashutosh and Chng, Eng Siong and Rajan, Deepu}, title = {A-V Representation Learning via Audio Shift Prediction for Multimodal Deepfake Detection and Temporal Localization}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {2553-2563} }
3D Gaussian Point Encoders-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{James_2026_WACV, author = {James, Jim and Wilson, Benjamin and Lucey, Simon and Hays, James}, title = {3D Gaussian Point Encoders}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1788-1797} }
CVP: Central-Peripheral Vision-Inspired Multimodal Model for Spatial Reasoning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chen_2026_WACV, author = {Chen, Zeyuan and Zhang, Xiang and Xu, Haiyang and Xie, Jianwen and Tu, Zhuowen}, title = {CVP: Central-Peripheral Vision-Inspired Multimodal Model for Spatial Reasoning}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {2295-2305} }
Not Like Transformers: Drop the Beat Representation for Dance Generation with Mamba-Based Diffusion Model-
[pdf]
[supp]
[bibtex]@InProceedings{Park_2026_WACV, author = {Park, Sangjune and Choi, Inhyeok and Soon, Donghyeon and Jeon, Youngwoo and Joo, Kyungdon}, title = {Not Like Transformers: Drop the Beat Representation for Dance Generation with Mamba-Based Diffusion Model}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1767-1776} }
Odo: Depth-Guided Diffusion for Identity-Preserving Body Reshaping-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Khandelwal_2026_WACV, author = {Khandelwal, Siddharth and Kamath, Sridhar and Jain, Arjun}, title = {Odo: Depth-Guided Diffusion for Identity-Preserving Body Reshaping}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {22-31} }
FAST-EQA: Efficient Embodied Question Answering with Global and Local Region Relevancy-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhang_2026_WACV, author = {Zhang, Haochen and Savaliya, Nirav and Siddiqui, Faizan and Sachdeva, Enna}, title = {FAST-EQA: Efficient Embodied Question Answering with Global and Local Region Relevancy}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1664-1673} }
FARF-Net: Frequency-guided Adaptive Receptive Field Network for Edge-enhanced Polyp Segmentation-
[pdf]
[bibtex]@InProceedings{Li_2026_WACV, author = {Li, Xue and Jiang, Aiwen and Yu, Hongqian and Xiao, Yang}, title = {FARF-Net: Frequency-guided Adaptive Receptive Field Network for Edge-enhanced Polyp Segmentation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {2338-2347} }
Text Slider: Efficient and Plug-and-Play Continuous Concept Control for Image/Video Synthesis via LoRA Adapters-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chiu_2026_WACV, author = {Chiu, Pin-Yen and Fang, I-Sheng and Chen, Jun-Cheng}, title = {Text Slider: Efficient and Plug-and-Play Continuous Concept Control for Image/Video Synthesis via LoRA Adapters}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {613-622} }
Beyond Realism: Learning the Art of Expressive Composition with StickerNet-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lu_2026_WACV, author = {Lu, Haoming and Kocharian, David and Shi, Humphrey}, title = {Beyond Realism: Learning the Art of Expressive Composition with StickerNet}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {869-878} }
ClusterMine: Robust Label-Free Visual Out-Of-Distribution Detection via Concept Mining from Text Corpora-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Adaloglou_2026_WACV, author = {Adaloglou, Nikolas and Petrusheva, Diana and Asker, Mohamed and Michels, Felix and Kollmann, Markus}, title = {ClusterMine: Robust Label-Free Visual Out-Of-Distribution Detection via Concept Mining from Text Corpora}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1999-2010} }
LENVIZ: A High-Resolution Low-Exposure Night Vision Benchmark Dataset-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Aithal_2026_WACV, author = {Aithal, Manjushree and VidalMata, Rosaura G. and Kartha, Manikandtan and Chen, Gong and Adhikarla, Eashan and Kirsten, Lucas Nedel and Fu, Zhicheng and Madhusudhana, Nikhil Ambha and Nasti, Joseph V.}, title = {LENVIZ: A High-Resolution Low-Exposure Night Vision Benchmark Dataset}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {2531-2540} }
MARS: a Multimodal Alignment and Ranking System for Few-Shot Segmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Catalano_2026_WACV, author = {Catalano, Nico and Samele, Stefano and Pertino, Paolo and Matteucci, Matteo}, title = {MARS: a Multimodal Alignment and Ranking System for Few-Shot Segmentation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1284-1293} }
DreamMakeup: Face Makeup Customization using Latent Diffusion Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Park_2026_WACV, author = {Park, Geon Yeong and Han, Inhwa and Yang, Serin and Hong, Yeobin and Jeong, Seongmin and Jeon, Heechan and Goh, Myeongjin and Yi, Sung Won and Nam, Jin and Ye, Jong Chul}, title = {DreamMakeup: Face Makeup Customization using Latent Diffusion Models}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {422-430} }
Morphing Through Time: Diffusion-Based Bridging of Temporal Gaps for Robust Alignment in Change Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Madani_2026_WACV, author = {Madani, Seyedehanita and Patel, Vishal M.}, title = {Morphing Through Time: Diffusion-Based Bridging of Temporal Gaps for Robust Alignment in Change Detection}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {431-439} }
DiRe: Diversity-promoting Regularization for Dataset Condensation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Mohanty_2026_WACV, author = {Mohanty, Saumyaranjan and Reddy, Aravind and Mopuri, Konda Reddy}, title = {DiRe: Diversity-promoting Regularization for Dataset Condensation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {2818-2827} }
Federated Model Synchronization for Diagnostic Redefinition through a Novel Selective Parameter Unlearning-
[pdf]
[supp]
[bibtex]@InProceedings{Kundalwal_2026_WACV, author = {Kundalwal, Mayank Kumar and Mamta, Mamta and Mishra, Deepak and Ekbal, Asif}, title = {Federated Model Synchronization for Diagnostic Redefinition through a Novel Selective Parameter Unlearning}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1395-1404} }
Diffusion-Based Authentication of Copy Detection Patterns: A Multimodal Framework with Printer Signature Conditioning-
[pdf]
[bibtex]@InProceedings{Atoki_2026_WACV, author = {Atoki, Bolutife and Tkachenko, Iuliia and Kerautret, Bertrand and Junior, Carlos Crispim}, title = {Diffusion-Based Authentication of Copy Detection Patterns: A Multimodal Framework with Printer Signature Conditioning}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1685-1694} }
MorphXAI: An Explainable Framework for Morphological Analysis of Parasites in Blood Smear Images-
[pdf]
[arXiv]
[bibtex]@InProceedings{Yousaf_2026_WACV, author = {Yousaf, Aqsa and Win, Sint Sint and Coffee, Megan and Olufowobi, Habeeb}, title = {MorphXAI: An Explainable Framework for Morphological Analysis of Parasites in Blood Smear Images}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {2125-2134} }
Multimodal Medical Image Binding via Shared Text Embeddings-
[pdf]
[arXiv]
[bibtex]@InProceedings{Liu_2026_WACV, author = {Liu, Yunhao and Xi, Suyang and Liu, Shiqi and Ding, Hong and Jin, Chicheng and Zhong, Chong and He, Junjun and Liu, Catherine C. and Shen, Yiqing}, title = {Multimodal Medical Image Binding via Shared Text Embeddings}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1610-1620} }
RAT4D: Rig and Animate Objects without Surface Templates in 4D-
[pdf]
[supp]
[bibtex]@InProceedings{Dabhi_2026_WACV, author = {Dabhi, Mosam and Lucey, Simon and Jeni, Laszlo A.}, title = {RAT4D: Rig and Animate Objects without Surface Templates in 4D}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {393-401} }
Reinforcement Learning-based Adaptive Control of Classifier-Free Guidance and Timestep Embeddings in Diffusion Models-
[pdf]
[bibtex]@InProceedings{You_2026_WACV, author = {You, Haochen and Liu, Baojing and He, Hongyang}, title = {Reinforcement Learning-based Adaptive Control of Classifier-Free Guidance and Timestep Embeddings in Diffusion Models}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {43-53} }
From Few-Shot to Zero-Shot Pallet Load Recognition: A Deployed Embedding-Based Vision System for Industrial Logistics-
[pdf]
[supp]
[bibtex]@InProceedings{del_Olmo_2026_WACV, author = {del Olmo, Juan Jes{\'u}s Losada and Ballesteros, Emilio Pardo and L{\'o}pez-de-Teruel, Pedro E. and Ruiz, Alberto}, title = {From Few-Shot to Zero-Shot Pallet Load Recognition: A Deployed Embedding-Based Vision System for Industrial Logistics}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {2901-2911} }
AFRAgent : An Adaptive Feature Renormalization Based High Resolution Aware GUI agent-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Anand_2026_WACV, author = {Anand, Neeraj and Jain, Rishabh and Patnaik, Sohan and Krishnamurthy, Balaji and Sarkar, Mausoom}, title = {AFRAgent : An Adaptive Feature Renormalization Based High Resolution Aware GUI agent}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1147-1158} }
SUGAR: A Sweeter Spot for Generative Unlearning of Many Identities-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Nguyen_2026_WACV, author = {Nguyen, Dung Thuy and Nguyen, Quang and Robinette, Preston K. and Jiang, Eli and Johnson, Taylor T. and Leach, Kevin}, title = {SUGAR: A Sweeter Spot for Generative Unlearning of Many Identities}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {2731-2740} }
mmWEAVER: Environment-Specific mmWave Signal Synthesis from a Photo and Activity Description-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Monjur_2026_WACV, author = {Monjur, Mahathir and Nirjon, Shahriar}, title = {mmWEAVER: Environment-Specific mmWave Signal Synthesis from a Photo and Activity Description}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1875-1884} }
Overcoming Fine-Grained Visual Challenges in Animal Re-Identification via Semantic Feature Alignment-
[pdf]
[supp]
[bibtex]@InProceedings{Wu_2026_WACV, author = {Wu, Yihao and Zhao, Di and Li, Yuzhuo and Alajas, Matthew and Glen, Alistair S. and Zhang, Jingfeng and Dobbie, Gillian and Wilson, Daniel and Koh, Yun Sing}, title = {Overcoming Fine-Grained Visual Challenges in Animal Re-Identification via Semantic Feature Alignment}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {371-381} }
Narrating For You: Prompt-guided Audio-visual Narrating Face Generation Employing Multi-entangled Latent Space-
[pdf]
[supp]
[bibtex]@InProceedings{K_2026_WACV, author = {K, Aashish Chandra and A V, Aashutosh and Das, Abhijit}, title = {Narrating For You: Prompt-guided Audio-visual Narrating Face Generation Employing Multi-entangled Latent Space}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1314-1323} }
Semi-Supervised Hierarchical Open-Set Classification-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wallin_2026_WACV, author = {Wallin, Erik and Kahl, Fredrik and Hammarstrand, Lars}, title = {Semi-Supervised Hierarchical Open-Set Classification}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1989-1998} }
BrightRate: Quality Assessment for User-Generated HDR Videos-
[pdf]
[supp]
[bibtex]@InProceedings{Saini_2026_WACV, author = {Saini, Shreshth and Chen, Bowen and Wang, Yilin and Birkbeck, Neil and Adsumilli, Balu and Bovik, Alan C.}, title = {BrightRate: Quality Assessment for User-Generated HDR Videos}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1522-1532} }
PHYSPLAT: a Framework for Photorealistic Hybrid Simulation of Real and Synthetic Elements using 3D Gaussian Splatting-
[pdf]
[supp]
[bibtex]@InProceedings{Alfonso-Arsuaga_2026_WACV, author = {Alfonso-Arsuaga, Mario and Dominguez-Elvira, Henar and Casas-Guerrero, Jorge and Castiella-Aguirrezabala, Andrea and Dom{\'\i}nguez, Lorenzo Cost{\'a}bile and Garc{\'\i}a-Gonz{\'a}lez, Jorge and Naranjo-Almeida, Maria and Comino-Trinidad, Marc and Lopez-Moreno, Jorge}, title = {PHYSPLAT: a Framework for Photorealistic Hybrid Simulation of Real and Synthetic Elements using 3D Gaussian Splatting}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1621-1631} }
One-Shot Fine-Grained Re-Identification of Paint Marked Honey Bees using Vision Foundation Models-
[pdf]
[bibtex]@InProceedings{Meyers_2026_WACV, author = {Meyers, Luke and Rodr{\'\i}guez-Cordero, Josu{\'e} A. and M{\'e}gret, R{\'e}mi}, title = {One-Shot Fine-Grained Re-Identification of Paint Marked Honey Bees using Vision Foundation Models}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {560-569} }
PaRaChute: Pathology-Radiology Cross-Modal Fusion for Missing-Modality-Robust Survival Prediction-
[pdf]
[supp]
[bibtex]@InProceedings{Caforio_2026_WACV, author = {Caforio, Pietro and Poles, Isabella and Santambrogio, Marco D.}, title = {PaRaChute: Pathology-Radiology Cross-Modal Fusion for Missing-Modality-Robust Survival Prediction}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {718-728} }
From Street to Orbit: Training-Free Cross-View Retrieval via Location Semantics and LLM Guidance-
[pdf]
[arXiv]
[bibtex]@InProceedings{Min_2026_WACV, author = {Min, Jeongho and Kim, Dongyoung and Lee, Jaehyup}, title = {From Street to Orbit: Training-Free Cross-View Retrieval via Location Semantics and LLM Guidance}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {570-579} }
MSRTrack: LLM-Powered Object Tracking with Motion and Semantic Reasoning-
[pdf]
[bibtex]@InProceedings{Shen_2026_WACV, author = {Shen, Tong and Wang, Di and Moura, Jos{\'e} M. F.}, title = {MSRTrack: LLM-Powered Object Tracking with Motion and Semantic Reasoning}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {838-848} }
MarineEval: Assessing the Marine Intelligence of Vision-Language Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wong_2026_WACV, author = {Wong, Yuk Kwan and To, Tuan-An and Zhang, Jipeng and Zheng, Ziqiang and Yeung, Sai-Kit}, title = {MarineEval: Assessing the Marine Intelligence of Vision-Language Models}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1459-1470} }
MMHOI: Modeling Complex 3D Multi-Human Multi-Object Interactions-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kogashi_2026_WACV, author = {Kogashi, Kaen and Cherian, Anoop and Kuo, Meng-Yu Jennifer}, title = {MMHOI: Modeling Complex 3D Multi-Human Multi-Object Interactions}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1512-1521} }
MomentMix Augmentation with Length-Aware DETR for Temporally Robust Moment Retrieval-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Park_2026_WACV, author = {Park, Seojeong and Choi, Jiho and Baek, Kyungjune and Shim, Hyunjung}, title = {MomentMix Augmentation with Length-Aware DETR for Temporally Robust Moment Retrieval}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1127-1136} }
SasMamba: A Lightweight Structure-Aware Stride State Space Model for 3D Human Pose Estimation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Cui_2026_WACV, author = {Cui, Hu and Hua, Wenqiang and Huang, Renjing and Jia, Shurui and Hayama, Tessai}, title = {SasMamba: A Lightweight Structure-Aware Stride State Space Model for 3D Human Pose Estimation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {2721-2730} }
Action Anticipation at a Glimpse: To What Extent Can Multimodal Cues Replace Video?-
[pdf]
[supp]
[bibtex]@InProceedings{Benavent-Lledo_2026_WACV, author = {Benavent-Lledo, Manuel and Bacharidis, Konstantinos and Manousaki, Victoria and Papoutsakis, Konstantinos and Argyros, Antonis and Garcia-Rodriguez, Jose}, title = {Action Anticipation at a Glimpse: To What Extent Can Multimodal Cues Replace Video?}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {276-286} }
Systematic Analysis of the Unintentional CSAM-Generation-Potential of Text-to-Image Models-
[pdf]
[bibtex]@InProceedings{Goller_2026_WACV, author = {G{\"o}ller, Nicolas and Steinebach, Martin}, title = {Systematic Analysis of the Unintentional CSAM-Generation-Potential of Text-to-Image Models}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {493-502} }
Towards Fast and Scalable Normal Integration using Continuous Components-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Milano_2026_WACV, author = {Milano, Francesco and Chung, Jen Jen and Ott, Lionel and Siegwart, Roland}, title = {Towards Fast and Scalable Normal Integration using Continuous Components}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {236-244} }
ViSTA: Visual Storytelling using Multi-modal Adapters for Text-to-Image Diffusion Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Dong_2026_WACV, author = {Dong, Sibo and Shaheen, Ismail and Shen, Maggie and Mallick, Rupayan and Bargal, Sarah Adel}, title = {ViSTA: Visual Storytelling using Multi-modal Adapters for Text-to-Image Diffusion Models}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {12-21} }
Data-Driven Lipschitz Continuity: A Cost-Effective Approach to Improve Adversarial Robustness-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chen_2026_WACV, author = {Chen, Erh-Chung and Chen, Pin-Yu and Chung, I-Hsin and Lee, Che-Rung}, title = {Data-Driven Lipschitz Continuity: A Cost-Effective Approach to Improve Adversarial Robustness}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {698-707} }
A Fast, Simple, and Flexible Scale Informative Feature Transform Module for Arbitrary Scale Image Super-Resolution-
[pdf]
[supp]
[bibtex]@InProceedings{Kar_2026_WACV, author = {Kar, Aupendu and Biswas, Prabir Kumar}, title = {A Fast, Simple, and Flexible Scale Informative Feature Transform Module for Arbitrary Scale Image Super-Resolution}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1405-1414} }
Human Knowledge Integrated Multi-modal Learning for Single Source Domain Generalization-
[pdf]
[supp]
[bibtex]@InProceedings{Banerjee_2026_WACV, author = {Banerjee, Ayan and Thakur, Kuntal and Gupta, Sandeep}, title = {Human Knowledge Integrated Multi-modal Learning for Single Source Domain Generalization}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {2380-2391} }
AFL-PRF: Adaptive Federated Learning for Low-Quality Data: Enhancing Performance, Robustness, and Fairness-
[pdf]
[bibtex]@InProceedings{Yu_2026_WACV, author = {Yu, Pinrui and Xie, Yiming and Ye, Longtian and Yuan, Geng and Mi, Ningfang and Lin, Xue}, title = {AFL-PRF: Adaptive Federated Learning for Low-Quality Data: Enhancing Performance, Robustness, and Fairness}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {402-411} }
CountingDINO: A Training-free Pipeline for Class-Agnostic Counting using Unsupervised Backbones-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Pacini_2026_WACV, author = {Pacini, Giacomo and Bianchi, Lorenzo and Ciampi, Luca and Messina, Nicola and Amato, Giuseppe and Falchi, Fabrizio}, title = {CountingDINO: A Training-free Pipeline for Class-Agnostic Counting using Unsupervised Backbones}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {806-815} }
FAE-Net: Fashion Attribute Editing via Disentangled Latent Conditioning in Diffusion Models-
[pdf]
[supp]
[bibtex]@InProceedings{Bhargav_2026_WACV, author = {Bhargav, P. Rajith and Bhattacharya, Gaurab and Vivek, B S and Gubbi, Jayavardhana}, title = {FAE-Net: Fashion Attribute Editing via Disentangled Latent Conditioning in Diffusion Models}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {192-201} }
SCORP: Scene-Consistent Object Refinement via Proxy Generation and Tuning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chen_2026_WACV, author = {Chen, Ziwei and Liu, Ziling and Huang, Zitong and Gao, Mingqi and Zheng, Feng}, title = {SCORP: Scene-Consistent Object Refinement via Proxy Generation and Tuning}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {795-805} }
The Perceptual Observatory Characterizing Robustness and Grounding in MLLMs-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Anvekar_2026_WACV, author = {Anvekar, Tejas and Bardoliya, Fenil and Turaga, Pavan K. and Baral, Chitta and Gupta, Vivek}, title = {The Perceptual Observatory Characterizing Robustness and Grounding in MLLMs}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1653-1663} }
Seeing is Believing (and Predicting): Context-Aware Multi-Human Behavior Prediction with Vision Language Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Panchal_2026_WACV, author = {Panchal, Utsav and Liu, Yuchen and Palmieri, Luigi and Georgievski, Ilche and Aiello, Marco}, title = {Seeing is Believing (and Predicting): Context-Aware Multi-Human Behavior Prediction with Vision Language Models}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1959-1968} }
MAESTRO: Masked AutoEncoders for Multimodal, Multitemporal, and Multispectral Earth Observation Data-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Labatie_2026_WACV, author = {Labatie, Antoine and Vaccaro, Michael and Lardiere, Nina and Garioud, Anatol and Gonthier, Nicolas}, title = {MAESTRO: Masked AutoEncoders for Multimodal, Multitemporal, and Multispectral Earth Observation Data}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {212-224} }
ASC: Learning Augmentation Severity-Consistent Representations Improves Generalization via Augmentation Search-
[pdf]
[supp]
[bibtex]@InProceedings{Alamdar_2026_WACV, author = {Alamdar, Amirhossein and Jafarinia, Hossein and Noori, Mahdi and Rohban, Mohammad Hossein}, title = {ASC: Learning Augmentation Severity-Consistent Representations Improves Generalization via Augmentation Search}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1926-1936} }
Learning to Animate Images from A Few Videos to Portray Delicate Human Actions-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2026_WACV, author = {Li, Haoxin and Yu, Yingchen and Wu, Qilong and Zhang, Hanwang and Bai, Song and Li, Boyang}, title = {Learning to Animate Images from A Few Videos to Portray Delicate Human Actions}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {547-559} }
UniCalib: Targetless LiDAR-camera Calibration via Probabilistic Flow on Unified Depth Representations-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Han_2026_WACV, author = {Han, Shu and Zhu, Xubo and Wu, Ji and Cai, Ximeng and Yang, Wen and Yu, Huai and Xia, Gui-Song}, title = {UniCalib: Targetless LiDAR-camera Calibration via Probabilistic Flow on Unified Depth Representations}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1906-1915} }
Beyond the Highlights: Video Retrieval with Salient and Surrounding Contexts-
[pdf]
[supp]
[bibtex]@InProceedings{Bang_2026_WACV, author = {Bang, Jaehun and Moon, Ye-Bin and Oh, Tae-Hyun and Joo, Kyungdon}, title = {Beyond the Highlights: Video Retrieval with Salient and Surrounding Contexts}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {2188-2197} }
PiSA: A Self-Augmented Data Engine and Training Strategy for 3D Understanding with Large Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Guo_2026_WACV, author = {Guo, Zilu and Lin, Hongbin and Yuan, Zhihao and Zheng, Chaoda and Qiu, Pengshuo and Jiang, Dongzhi and Zhang, Renrui and Feng, Chun-Mei and Li, Zhen}, title = {PiSA: A Self-Augmented Data Engine and Training Strategy for 3D Understanding with Large Models}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1273-1283} }
Analysis of Text Accuracy and Visual Alignment in Vision-Language Models for Artistic Text Generation-
[pdf]
[bibtex]@InProceedings{Alderazi_2026_WACV, author = {Alderazi, Fatima and Alfarraj, Motaz}, title = {Analysis of Text Accuracy and Visual Alignment in Vision-Language Models for Artistic Text Generation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {879-887} }
Do Generative Video Models Understand Physical Principles?-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Motamed_2026_WACV, author = {Motamed, Saman and Culp, Laura and Swersky, Kevin and Jaini, Priyank and Geirhos, Robert}, title = {Do Generative Video Models Understand Physical Principles?}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {948-958} }
AnyBald: Toward Realistic Diffusion-Based Hair Removal In-The-Wild-
[pdf]
[supp]
[bibtex]@InProceedings{Choi_2026_WACV, author = {Choi, Yongjun and Han, Seungoh and Kim, Soomin and Son, Sumin and Rohani, Mohsen and Maucourant, Edgar and Min, Dongbo and Joo, Kyungdon}, title = {AnyBald: Toward Realistic Diffusion-Based Hair Removal In-The-Wild}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {2220-2230} }
A Multi-Agent Diffusion Approach for MRI Anomaly Segmentation via Modality-Specific LoRA Specialization-
[pdf]
[bibtex]@InProceedings{Al_Ghallabi_2026_WACV, author = {Al Ghallabi, Wafa and Zaheer, Muhammad Zaigham and Thawkar, Ritesh and Thawakar, Omkar and Khan, Salman and Khan, Fahad Shahbaz}, title = {A Multi-Agent Diffusion Approach for MRI Anomaly Segmentation via Modality-Specific LoRA Specialization}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {128-137} }
ZonUI-3B: Competitive GUI Grounding with a 3B VLM Trained on a Single Consumer GPU-
[pdf]
[supp]
[bibtex]@InProceedings{Hsieh_2026_WACV, author = {Hsieh, ZongHan and Yang, ShengJing and Wei, Tzer-Jen}, title = {ZonUI-3B: Competitive GUI Grounding with a 3B VLM Trained on a Single Consumer GPU}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {959-966} }
Sketch2Stitch: GANs for Abstract Sketch-Based Dress Synthesis-
[pdf]
[supp]
[bibtex]@InProceedings{Khan_2026_WACV, author = {Khan, Faizan Farooq and Bakr, Eslam Abdelrahman and Morelli, Davide and Cornia, Marcella and Cucchiara, Rita and Elhoseiny, Mohamed}, title = {Sketch2Stitch: GANs for Abstract Sketch-Based Dress Synthesis}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {2209-2219} }
You May Speak Freely: Improving the Fine-Grained Visual Recognition Capabilities of Multimodal Large Language Models with Answer Extraction-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lawrence_2026_WACV, author = {Lawrence, Logan and Saha, Oindrila and Wei, Megan and Sun, Chen and Maji, Subhransu and Van Horn, Grant}, title = {You May Speak Freely: Improving the Fine-Grained Visual Recognition Capabilities of Multimodal Large Language Models with Answer Extraction}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1428-1437} }
Evaluating Text-to-Image and Text-to-Video Synthesis with a Conditional Frechet Distance-
[pdf]
[supp]
[bibtex]@InProceedings{Koo_2026_WACV, author = {Koo, Jaywon and Hernandez, Jefferson and Haji-Ali, Moayed and Yang, Ziyan and Ordonez, Vicente}, title = {Evaluating Text-to-Image and Text-to-Video Synthesis with a Conditional Frechet Distance}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {2052-2062} }
mEOL: Training-Free Instruction-Guided Multimodal Embedder for Vector Graphics and Image Retrieval-
[pdf]
[supp]
[bibtex]@InProceedings{Kim_2026_WACV, author = {Kim, Kyeong Seon and Baek, Seong-Eun and Lee, Jung-Mok and Oh, Tae-Hyun}, title = {mEOL: Training-Free Instruction-Guided Multimodal Embedder for Vector Graphics and Image Retrieval}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1191-1200} }
GateFusion: Hierarchical Gated Cross-Modal Fusion for Active Speaker Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2026_WACV, author = {Wang, Yu and Ha, Juhyung and Ramirez, Frangil M. and Wang, Yuchen and Crandall, David J.}, title = {GateFusion: Hierarchical Gated Cross-Modal Fusion for Active Speaker Detection}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1074-1083} }
Detection-Driven Object Count Optimization for Text-to-Image Diffusion Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zafar_2026_WACV, author = {Zafar, Oz and Cohen, Yuval and Wolf, Lior and Schwartz, Idan}, title = {Detection-Driven Object Count Optimization for Text-to-Image Diffusion Models}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1885-1894} }
Fully Unsupervised Self-debiasing of Text-to-Image Diffusion Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Vardhana_2026_WACV, author = {Vardhana, Korada Sri and Lolla, Shrikrishna and Biswas, Soma}, title = {Fully Unsupervised Self-debiasing of Text-to-Image Diffusion Models}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1221-1230} }
Salience-SGG: Enhancing Unbiased Scene Graph Generation with Iterative Salience Estimation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Qu_2026_WACV, author = {Qu, Runfeng and Hall, Ole and Bideau, Pia K and Ouerfelli-Ethier, Julie and Rolfs, Martin and Obermayer, Klaus and Hellwich, Olaf}, title = {Salience-SGG: Enhancing Unbiased Scene Graph Generation with Iterative Salience Estimation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1032-1042} }
SPAR-Det: Segmentation-guided and Prior-Aided Routing for Small Object Detection-
[pdf]
[supp]
[bibtex]@InProceedings{Kwon_2026_WACV, author = {Kwon, Seungchan and Lim, Gyuil and Han, Youngjoon}, title = {SPAR-Det: Segmentation-guided and Prior-Aided Routing for Small Object Detection}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {2146-2155} }
Mitigating the Modality Gap: Few-Shot Out-of-Distribution Detection with Multi-modal Prototypes and Image Bias Estimation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2026_WACV, author = {Wang, Yimu and Riddell, Evelien and Chow, Adrian and Sedwards, Sean and Czarnecki, Krzysztof}, title = {Mitigating the Modality Gap: Few-Shot Out-of-Distribution Detection with Multi-modal Prototypes and Image Bias Estimation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {2741-2751} }
SymNet: A Multi-Task Network for Joint Radio Map Reconstruction and Transmitter Localization-
[pdf]
[bibtex]@InProceedings{Ye_2026_WACV, author = {Ye, Lyuzhou and Le, Thanh Dat and Huang, Yan}, title = {SymNet: A Multi-Task Network for Joint Radio Map Reconstruction and Transmitter Localization}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {150-159} }
3DSceneEditor: Controllable 3D Scene Editing with Gaussian Splatting-
[pdf]
[supp]
[bibtex]@InProceedings{Yan_2026_WACV, author = {Yan, Ziyang and Shao, Yihua and Liao, Minwen and Chen, Siyu and Wang, Nan and Lin, Muyuan and Hwang, Jenq-Neng and Zhao, Hao and Remondino, Fabio and Li, Lei}, title = {3DSceneEditor: Controllable 3D Scene Editing with Gaussian Splatting}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1852-1863} }
Matching Semantically Similar Non-Identical Objects-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Marumo_2026_WACV, author = {Marumo, Yusuke and Kawamoto, Kazuhiko and Tanaka, Satomi and Hirano, Shigenobu and Kera, Hiroshi}, title = {Matching Semantically Similar Non-Identical Objects}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {2752-2764} }
Pyramidal Spectrum: Frequency-based Hierarchically Vector Quantized VAE for Videos-
[pdf]
[supp]
[bibtex]@InProceedings{Prakash_2026_WACV, author = {Prakash, Tushar and Susladkar, Onkar and Mittal, Sparsh and Dhillon, Inderjit S}, title = {Pyramidal Spectrum: Frequency-based Hierarchically Vector Quantized VAE for Videos}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {2073-2082} }
Learning Mask-Aware Offsets: Two-branch Deformable Attention Networks for Inpainting with Masked Region Avoidance-
[pdf]
[supp]
[bibtex]@InProceedings{Oh_2026_WACV, author = {Oh, Hyeongseok and Paik, Joonki}, title = {Learning Mask-Aware Offsets: Two-branch Deformable Attention Networks for Inpainting with Masked Region Avoidance}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1022-1031} }
QuadraNet V2: Efficient and Sustainable Training of High-Order Neural Networks with Quadratic Adaptation-
[pdf]
[arXiv]
[bibtex]@InProceedings{Xu_2026_WACV, author = {Xu, Chenhui and Yu, Fuxun and Xiong, Jinjun and Chen, Xiang}, title = {QuadraNet V2: Efficient and Sustainable Training of High-Order Neural Networks with Quadratic Adaptation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1365-1373} }
Personalized Image Privacy Advisors via Federated Daisy-Chaining-
[pdf]
[supp]
[bibtex]@InProceedings{Banerjee_2026_WACV, author = {Banerjee, Sourasekhar and Subramaniam, Vengateswaran and Roy, Debaditya and Subbaraju, Vigneshwaran and Bhuyan, Monowar}, title = {Personalized Image Privacy Advisors via Federated Daisy-Chaining}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {2808-2817} }
Prompt-OT: An Optimal Transport Regularization Paradigm for Knowledge Preservation in Vision-Language Model Adaptation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chen_2026_WACV, author = {Chen, Xiwen and Zhu, Wenhui and Qiu, Peijie and Wang, Hao and Li, Huayu and Wu, Haiyu and Dong, Xuanzhao and Sotiras, Aristeidis and Wang, Yalin and Razi, Abolfazl}, title = {Prompt-OT: An Optimal Transport Regularization Paradigm for Knowledge Preservation in Vision-Language Model Adaptation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {667-676} }
SCORE: Soft Label Compression-Centric Dataset Condensation via Coding Rate Optimization-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yuan_2026_WACV, author = {Yuan, Bowen and Fu, Yuxia and Wang, Zijian and Luo, Yadan and Huang, Zi}, title = {SCORE: Soft Label Compression-Centric Dataset Condensation via Coding Rate Optimization}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {2198-2208} }
BAFIS: Dataset + Framework to Assess Occupational Bias and Human Preference in Modern Text-to-image Models-
[pdf]
[supp]
[bibtex]@InProceedings{Klassert_2026_WACV, author = {Klassert, Thomas and Ulges, Adrian and Fu, Biying}, title = {BAFIS: Dataset + Framework to Assess Occupational Bias and Human Preference in Modern Text-to-image Models}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {2168-2177} }
Cosine Similarity is Almost All You Need (for Prototypical-Part Models)-
[pdf]
[supp]
[bibtex]@InProceedings{Moffett_2026_WACV, author = {Moffett, Luke and Willard, Frank and Machado, Maximillian and Mokel, Emmanuel and Donnelly, Jon and Guo, Zhicheng and Costarino, Adam and Yang, Julia and Kim, Giyoung and Barnett, Alina Jade and Rudin, Cynthia}, title = {Cosine Similarity is Almost All You Need (for Prototypical-Part Models)}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1586-1596} }
Illuminating Darkness: Learning to Enhance Low-light Images In-the-Wild-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Sharif_2026_WACV, author = {Sharif, S. M. A. and Rehman, Abdur and Abidin, Zain Ul and Dharejo, Fayaz Ali and Timofte, Radu and Naqvi, Rizwan Ali}, title = {Illuminating Darkness: Learning to Enhance Low-light Images In-the-Wild}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {2263-2272} }
Imitating the Functionality of Image-to-Image Models Using a Single Example-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Spingarn_2026_WACV, author = {Spingarn, Nurit and Michaeli, Tomer}, title = {Imitating the Functionality of Image-to-Image Models Using a Single Example}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {2178-2187} }
ArchitectHead: Continuous Level of Detail Control for 3D Gaussian Head Avatars-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yan_2026_WACV, author = {Yan, Peizhi and Ward, Rabab and Tang, Qiang and Du, Shan}, title = {ArchitectHead: Continuous Level of Detail Control for 3D Gaussian Head Avatars}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1632-1642} }
SAFER-AiD: Saccade-Assisted Foveal-peripheral vision Enhanced Reconstruction for Adversarial Defense-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liu_2026_WACV, author = {Liu, Jiayang and Ts'o, Daniel and Bu, Yiming and Qiu, Qinru}, title = {SAFER-AiD: Saccade-Assisted Foveal-peripheral vision Enhanced Reconstruction for Adversarial Defense}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1726-1735} }
Saliency-Guided DETR for Moment Retrieval and Highlight Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Gordeev_2026_WACV, author = {Gordeev, Aleksandr and Dokholyan, Vladimir and Tolstykh, Irina and Kuprashevich, Maksim}, title = {Saliency-Guided DETR for Moment Retrieval and Highlight Detection}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {907-916} }
MooTrack360: A Novel Fisheye Camera Dataset for Robust Multi Diary Cow Detection and Tracking-
[pdf]
[bibtex]@InProceedings{Christiansen_2026_WACV, author = {Christiansen, Rasmus Gjerlund K. and Van Nguyen, Toan and Malsk{\ae}r, Lasse Rose and Bodenhagen, Leon and Kraft, Dirk}, title = {MooTrack360: A Novel Fisheye Camera Dataset for Robust Multi Diary Cow Detection and Tracking}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {451-460} }
Tables Decoded: DELTA for Structure, TARQA for Understanding-
[pdf]
[supp]
[bibtex]@InProceedings{Rajput_2026_WACV, author = {Rajput, Jahanvi and Kudale, Dhruv and Kasturi, Saikiran and Verma, Utkarsh and Ramakrishnan, Ganesh}, title = {Tables Decoded: DELTA for Structure, TARQA for Understanding}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {2775-2785} }
HumanGuideNet: Adapter-Based Alignment of Deep Neural Networks with Human Similarity Judgments-
[pdf]
[supp]
[bibtex]@InProceedings{Liu_2026_WACV, author = {Liu, Xufu and Yang, Yifan and Zhang, Zhengxin}, title = {HumanGuideNet: Adapter-Based Alignment of Deep Neural Networks with Human Similarity Judgments}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1798-1808} }
Mixed Diffusion for 3D Indoor Scene Synthesis-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Hu_2026_WACV, author = {Hu, Siyi and Arroyo, Diego Mart{\'\i}n and Debats, Stephanie and Manhardt, Fabian and Carlone, Luca and Tombari, Federico}, title = {Mixed Diffusion for 3D Indoor Scene Synthesis}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1262-1272} }
PSA-MIL: A Probabilistic Spatial Attention-Based Multiple Instance Learning for Whole Slide Image Classification-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Peled_2026_WACV, author = {Peled, Sharon and Maruvka, Yosef E. and Freiman, Moti}, title = {PSA-MIL: A Probabilistic Spatial Attention-Based Multiple Instance Learning for Whole Slide Image Classification}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1211-1220} }
Diverse Sketch Colorization with Content-Enhanced Style Representation and Recolorization Distillation-
[pdf]
[supp]
[bibtex]@InProceedings{Mao_2026_WACV, author = {Mao, Shuangming and Zhu, Haixiang}, title = {Diverse Sketch Colorization with Content-Enhanced Style Representation and Recolorization Distillation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {1064--1073} }
A Framework for Real-Time Surgical Phase Recognition with Application to Robot-Assisted Partial Nephrectomy-
[pdf]
[supp]
[bibtex]@InProceedings{Mezzina_2026_WACV, author = {Mezzina, Marco and Vercauteren, Tom and Tuytelaars, Tinne and Blaschko, Matthew B.}, title = {A Framework for Real-Time Surgical Phase Recognition with Application to Robot-Assisted Partial Nephrectomy}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {245--254} }
Understanding Generative AI Capabilities in Everyday Image Editing Tasks-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Collins_2026_WACV, author = {Collins, Brandon and Taesiri, Mohammad Reza and Bolton, Logan and Lai, Viet Dac and Dernoncourt, Franck and Bui, Trung and Nguyen, Anh Totti}, title = {Understanding Generative {AI} Capabilities in Everyday Image Editing Tasks}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {2231--2241} }
Distilling Diversity and Control in Diffusion Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Gandikota_2026_WACV, author = {Gandikota, Rohit and Bau, David}, title = {Distilling Diversity and Control in Diffusion Models}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {1304--1313} }
Network-agnostic Distortion-robust Projections for Wide-angle Image Understanding-
[pdf]
[supp]
[bibtex]@InProceedings{Athwale_2026_WACV, author = {Athwale, Akshaya and Ahmad, Ola and Lalonde, Jean-Francois}, title = {Network-agnostic Distortion-robust Projections for Wide-angle Image Understanding}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {591--601} }
Interleaved Vision-and-Language Generation via Generative Voken-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zheng_2026_WACV, author = {Zheng, Kaizhi and He, Xuehai and Wang, Xin Eric}, title = {Interleaved Vision-and-Language Generation via Generative Voken}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {472--482} }
SaccadeX: Directed Acyclic Graph-based Semi-Supervised Learning of Continuous Ocular Dynamics from Sparse Neuromorphic Streams-
[pdf]
[supp]
[bibtex]@InProceedings{Bandara_2026_WACV, author = {Bandara, Nuwan and Kandappu, Thivya and Misra, Archan}, title = {{SaccadeX}: Directed Acyclic Graph-based Semi-Supervised Learning of Continuous Ocular Dynamics from Sparse Neuromorphic Streams}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {1384--1394} }
CAAC: Confidence-Aware Attention Calibration to Reduce Hallucinations in Large Vision-Language Models-
[pdf]
[supp]
[bibtex]@InProceedings{Fazli_2026_WACV, author = {Fazli, Mehrdad and Wei, Bowen and Sari, Ahmet and Zhu, Ziwei}, title = {{CAAC}: Confidence-Aware Attention Calibration to Reduce Hallucinations in Large Vision-Language Models}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {1242--1251} }
EmojiDiff: Advanced Facial Expression Control with High Identity Preservation in Portrait Generation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Jiang_2026_WACV, author = {Jiang, Liangwei and Li, Ruida and Zhang, Zhifeng and Fang, Shuo and Ma, Chenguang}, title = {{EmojiDiff}: Advanced Facial Expression Control with High Identity Preservation in Portrait Generation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {328--338} }
A Universal Self-Attention Enhancement for Bridging Low-bit Quantization and Vision Transformers-
[pdf]
[bibtex]@InProceedings{Qian_2026_WACV, author = {Qian, Jiahe and Wang, Peisong and Zhuge, Zhengyang and Hu, Qinghao and Cheng, Jian}, title = {A Universal Self-Attention Enhancement for Bridging Low-bit Quantization and Vision Transformers}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {360--370} }
ORCA: Object Recognition and Comprehension for Archiving Marine Species-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wong_2026_WACV, author = {Wong, Yuk-Kwan and Liang, Haixin and Ma, Zeyu and Chen, Yiwei and Zheng, Ziqiang and Gotama, Rinaldi and Sebastian, Pascal and Sparks, Lauren D. and Yeung, Sai-Kit}, title = {{ORCA}: Object Recognition and Comprehension for Archiving Marine Species}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {1597--1609} }
Learnable Query-Enhanced Pose Transformation-
[pdf]
[bibtex]@InProceedings{Wang_2026_WACV, author = {Wang, Yi-Zhen and Shuai, Hong-Han}, title = {Learnable Query-Enhanced Pose Transformation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {2032--2041} }
Detecting Out-of-Distribution Objects through Class-Conditioned Inpainting-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Nguyen_2026_WACV, author = {Nguyen, Quang-Huy and Zhou, Jin Peng and Liu, Zhenzhen and Bui, Khanh-Huyen and Weinberger, Kilian Q. and Chao, Wei-Lun and Le, Dung D.}, title = {Detecting Out-of-Distribution Objects through Class-Conditioned Inpainting}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {1937--1947} }
GrounDiff: Diffusion-Based Ground Surface Generation from Digital Surface Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Dhaouadi_2026_WACV, author = {Dhaouadi, Oussema and Meier, Johannes and Kaiser, Jacques and Cremers, Daniel}, title = {{GrounDiff}: Diffusion-Based Ground Surface Generation from Digital Surface Models}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {1355--1364} }
What Happens When: Learning Temporal Orders of Events in Videos-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ahn_2026_WACV, author = {Ahn, Daechul and Choi, Yura and Choi, Hyeonbeom and Cho, Seongwon and Kim, San and Choi, Jonghyun}, title = {What Happens When: Learning Temporal Orders of Events in Videos}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {2786--2796} }
Identity Verification from Human Scent using Channel Representation of 2D Gas Chromatography-Mass Spectrometry Data-
[pdf]
[supp]
[bibtex]@InProceedings{Spetlik_2026_WACV, author = {Spetlik, Radim and Hlavsa, Jan and {\v{C}}echov{\'a}, Jana and Pojmanov{\'a}, Petra and Matas, Jiri and Urban, {\v{S}}t{\v{e}}p{\'a}n}, title = {Identity Verification from Human Scent using Channel Representation of {2D} Gas Chromatography-Mass Spectrometry Data}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {1471--1480} }
DoTA: Latent Distribution Conditioned Data Attribution for Diffusion Models-
[pdf]
[supp]
[bibtex]@InProceedings{Joshi_2026_WACV, author = {Joshi, Ninad and Srivastava, Vivek and Karande, Shirish}, title = {{DoTA}: Latent Distribution Conditioned Data Attribution for Diffusion Models}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {2022--2031} }
Face-LLaVA: Facial Expression and Attribute Understanding through Instruction Tuning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chaubey_2026_WACV, author = {Chaubey, Ashutosh and Guan, Xulang and Soleymani, Mohammad}, title = {{Face-LLaVA}: Facial Expression and Attribute Understanding through Instruction Tuning}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {2648--2660} }
UI-Styler: Ultrasound Image Style Transfer with Class-Aware Prompts for Cross-Device Diagnosis Using a Frozen Black-Box Inference Network-
[pdf]
[supp]
[bibtex]@InProceedings{Do-Tran_2026_WACV, author = {Do-Tran, Nhat-Tuong and Le, Ngoc-Hoang-Lam and Huang, Ching-Chun}, title = {{UI-Styler}: Ultrasound Image Style Transfer with Class-Aware Prompts for Cross-Device Diagnosis Using a Frozen Black-Box Inference Network}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {2765--2774} }
Dressing the Imagination: A Dataset for AI-Powered Translation of Text into Fashion Outfits and A Novel NeRA Adapter for Enhanced Feature Adaptation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Deshmukh_2026_WACV, author = {Deshmukh, Gayatri and De, Somsubhra and Sehgal, Chirag and Gupta, Jishu Sen and Mittal, Sparsh}, title = {Dressing the Imagination: A Dataset for {AI}-Powered Translation of Text into Fashion Outfits and A Novel {NeRA} Adapter for Enhanced Feature Adaptation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {2094--2103} }
Marshaled Learning: Bridging Large Neural Networks with Memory-Constrained Trusted Execution Environments in Federated Learning-
[pdf]
[supp]
[bibtex]@InProceedings{Ding_2026_WACV, author = {Ding, Shiwei and Yuan, Xiaoyong and Wang, Zhenlin and Zhang, Lan Emily and Ateniese, Giuseppe}, title = {Marshaled Learning: Bridging Large Neural Networks with Memory-Constrained Trusted Execution Environments in Federated Learning}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {647--656} }
Reconstructing Realistic and Relightable Eyes-
[pdf]
[supp]
[bibtex]@InProceedings{Khademi_2026_WACV, author = {Khademi, Wesley and Kundu, Jogendra and An, Yatong and Fix, Alexander and Colmenares, David}, title = {Reconstructing Realistic and Relightable Eyes}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {2242--2252} }
PS3: Part Level Instance Segmentation in 3D-
[pdf]
[supp]
[bibtex]@InProceedings{Yen_2026_WACV, author = {Yen, Hong-Xuan and Chen, Chiamin and Wang, Yanqing and Liu, Yu-Lun and Sun, Min}, title = {{PS3}: Part Level Instance Segmentation in {3D}}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {898--906} }
UNO: Unifying One-stage Video Scene Graph Generation via Object-Centric Visual Representation Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Le_2026_WACV, author = {Le, Huy and Chung, Nhat and Kieu, Tung and Yang, Jingkang and Le, Ngan}, title = {{UNO}: Unifying One-stage Video Scene Graph Generation via Object-Centric Visual Representation Learning}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {2797--2807} }
ITSELF: Attention Guided Fine-Grained Alignment for Vision-Language Retrieval-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Nguyen_2026_WACV, author = {Nguyen, Tien-Huy and Tran, Huu-Loc and Ngo, Thanh Duc}, title = {{ITSELF}: Attention Guided Fine-Grained Alignment for Vision-Language Retrieval}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {1448--1458} }
Segmentation-Aware Latent Diffusion for Satellite Image Super-Resolution: Enabling Smallholder Farm Boundary Delineation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Agarwal_2026_WACV, author = {Agarwal, Aditi and Jain, Anjali and Saxena, Nikita and Deshpande, Ishan and Kazmierski, Michal and Annkah, Abigail and Sherman, Nadav and Shanmugam, Karthikeyan and Talekar, Alok and Rajan, Vaibhav}, title = {Segmentation-Aware Latent Diffusion for Satellite Image Super-Resolution: Enabling Smallholder Farm Boundary Delineation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {1864--1874} }
Eff-GRot: Efficient and Generalizable Rotation Estimation with Transformers-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Mathioulakis_2026_WACV, author = {Mathioulakis, Fanis and Radevski, Gorjan and Tuytelaars, Tinne}, title = {{Eff-GRot}: Efficient and Generalizable Rotation Estimation with Transformers}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {412--421} }
Roadside Monocular 3D Detection Prompted by 2D Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ma_2026_WACV, author = {Ma, Yechi and Hua, Wei and Li, Yanan and Kong, Shu}, title = {Roadside Monocular {3D} Detection Prompted by {2D} Detection}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {1895--1905} }
Divide and Refine: Enhancing Multimodal Representation and Explainability for Emotion Recognition in Conversation-
[pdf]
[arXiv]
[bibtex]@InProceedings{Mai_2026_WACV, author = {Mai, Anh-Tuan and Nguyen, Cam-Van Thi and Le, Duc-Trong}, title = {Divide and Refine: Enhancing Multimodal Representation and Explainability for Emotion Recognition in Conversation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {2700--2709} }
End-to-End Fine-Tuning of 3D Texture Generation using Differentiable Rewards-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zamani_2026_WACV, author = {Zamani, AmirHossein and Xie, Tianhao and Aghdam, Amir G. and Popa, Tiberiu and Belilovsky, Eugene}, title = {End-to-End Fine-Tuning of {3D} Texture Generation using Differentiable Rewards}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {171--180} }
ImageNet-sES: A First Systematic Study of Sensor-Environment Simulation Anchored by Real Recaptures-
[pdf]
[bibtex]@InProceedings{Kim_2026_WACV, author = {Kim, Ji-yoon and Baek, Eunsu and Kim, Hyung-Sin}, title = {{ImageNet-sES}: A First Systematic Study of Sensor-Environment Simulation Anchored by Real Recaptures}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {1117--1126} }
MEDAL: multi-modal MEta-space Distillation and ALignment for Visual Compatibility Learning-
[pdf]
[supp]
[bibtex]@InProceedings{Sanny_2026_WACV, author = {Sanny, Dween Rabius and Verma, Vinay Kumar and Sircar, Prateek and Gupta, Deepak}, title = {{MEDAL}: multi-modal {MEta-space} Distillation and {ALignment} for Visual Compatibility Learning}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {888--897} }
LiDAR-DHMT: LiDAR-Adaptive Dual Hierarchical Mask Transformer for Robust Freespace Detection and Semantic Segmentation-
[pdf]
[bibtex]@InProceedings{Chen_2026_WACV, author = {Chen, Siyu and Han, Ting and Zhang, Changshe and Luo, Xin and Chen, Huan and Wu, Meiliu and Cai, Guorong and Su, Jinhe}, title = {{LiDAR-DHMT}: {LiDAR}-Adaptive Dual Hierarchical Mask Transformer for Robust Freespace Detection and Semantic Segmentation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {1252--1261} }
Layout Anything: One Transformer for Universal Room Layout Estimation-
[pdf]
[arXiv]
[bibtex]@InProceedings{Mia_2026_WACV, author = {Mia, Md Sohag and Adnan, Muhammad Abdullah}, title = {Layout Anything: One Transformer for Universal Room Layout Estimation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {1565--1574} }
TS-PCI: Point Cloud Frame Interpolation with Time-Aware Point Cloud Sampling and Self-Supervised Learning Strategy-
[pdf]
[bibtex]@InProceedings{Matsuzaki_2026_WACV, author = {Matsuzaki, Kohei and Nonaka, Keisuke}, title = {{TS-PCI}: Point Cloud Frame Interpolation with Time-Aware Point Cloud Sampling and Self-Supervised Learning Strategy}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {54--65} }
UniCoRN: Latent Diffusion-based Unified Controllable Image Restoration Network across Multiple Degradations-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Mandal_2026_WACV, author = {Mandal, Debabrata and Chattopadhyay, Soumitri and Tong, Guansen and Chakravarthula, Praneeth}, title = {{UniCoRN}: Latent Diffusion-based Unified Controllable Image Restoration Network across Multiple Degradations}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {1543--1553} }
CURIO: Curvature-Aligned and Efficient OCR for Low-Resource Historical Manuscripts-
[pdf]
[supp]
[bibtex]@InProceedings{Gunda_2026_WACV, author = {Gunda, Sai Madhusudan and Ghosh, Tathagata and Sandral, Simran Singh and Sarvadevabhatla, Ravi Kiran}, title = {{CURIO}: Curvature-Aligned and Efficient {OCR} for Low-Resource Historical Manuscripts}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {2011--2021} }
InteracTalker: Prompt-Based Human-Object Interaction with Co-Speech Gesture Generation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Rajan_2026_WACV, author = {Rajan, Sreehari and Bhosikar, Kunal and Sharma, Charu}, title = {{InteracTalker}: Prompt-Based Human-Object Interaction with Co-Speech Gesture Generation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {1438--1447} }
EllipssianNet: Image-guided Sampling of 2D Gaussians for Gaussian Splatting-
[pdf]
[supp]
[bibtex]@InProceedings{Kim_2026_WACV, author = {Kim, MyoungGon and Ahn, JeongHyeon and Park, Seohyeon and Kim, Hyemi and Park, Seunghyun and Hwang, Jung Ho and Han, JungHyun}, title = {{EllipssianNet}: Image-guided Sampling of {2D} {Gaussians} for {Gaussian} Splatting}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {2104--2113} }
SSplain: Sparse and Smooth Explainer for Retinopathy of Prematurity Classification-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Sunger_2026_WACV, author = {Sunger, Elifnur and Imbiriba, Tales and Campbell, Peter and Erdogmus, Deniz and Ioannidis, Stratis and Dy, Jennifer}, title = {{SSplain}: Sparse and Smooth Explainer for Retinopathy of Prematurity Classification}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {1705--1715} }
AdaptViG: Adaptive Vision GNN with Exponential Decay Gating-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Munir_2026_WACV, author = {Munir, Mustafa and Rahman, Md Mostafijur and Marculescu, Radu}, title = {{AdaptViG}: Adaptive Vision {GNN} with Exponential Decay Gating}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {440--450} }
PADM: A Physics-aware Diffusion Model for Attenuation Correction-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Pham_2026_WACV, author = {Pham, Trung Kien and Vu, Hoang Minh and Chu, Anh Duc and Nguyen, Dac Thai and Nguyen, Trung Thanh and Truong, Thao Nguyen and Son, Mai Hong and Nguyen, Thanh Trung and Le Nguyen, Phi}, title = {{PADM}: A Physics-aware Diffusion Model for Attenuation Correction}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {2606--2615} }
MEGA-PCC: A Mamba-based Efficient Approach for Joint Geometry and Attribute Point Cloud Compression-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Hsieh_2026_WACV, author = {Hsieh, Kai-Hsiang and Yim, Monyneath and Peng, Wen-Hsiao and Chiang, Jui-Chiu}, title = {{MEGA-PCC}: A {Mamba}-based Efficient Approach for Joint Geometry and Attribute Point Cloud Compression}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {1820--1830} }
Interaction-via-Actions: Cattle Interaction Detection with Joint Learning of Action-Interaction Latent Space-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Nakagawa_2026_WACV, author = {Nakagawa, Ren and Yang, Yang and Shinoda, Risa and Santo, Hiroaki and Oyama, Kenji and Okura, Fumio and Ohkawa, Takenao}, title = {Interaction-via-Actions: Cattle Interaction Detection with Joint Learning of Action-Interaction Latent Space}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {1979--1988} }
RobustGait: Robustness Analysis for Appearance Based Gait Recognition-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Sayera_2026_WACV, author = {Sayera, Reeshoon and Kumar, Akash and Mitra, Sirshapan and Kamtam, Prudvi and Rawat, Yogesh S}, title = {{RobustGait}: Robustness Analysis for Appearance Based Gait Recognition}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {2541--2552} }
Zero-Shot Video Deraining with Video Diffusion Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Varanka_2026_WACV, author = {Varanka, Tuomas and Gonzalez, Juan Luis and Kim, Hyeongwoo and Garrido, Pablo and Yao, Xu}, title = {Zero-Shot Video Deraining with Video Diffusion Models}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {677--687} }
DynaGSLAM: Real-Time Gaussian-Splatting SLAM for Online Rendering, Tracking, Motion Predictions of Moving Objects in Dynamic Scenes-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2026_WACV, author = {Li, Runfa Blark and Shaghaghi, Mahdi and Suzuki, Keito and Liu, Xinshuang and Moparthi, Varun and Du, Bang and Curtis, Walker and Renschler, Martin and Lee, Ki Myung Brian and Atanasov, Nikolay and Nguyen, Truong}, title = {{DynaGSLAM}: Real-Time {Gaussian}-Splatting {SLAM} for Online Rendering, Tracking, Motion Predictions of Moving Objects in Dynamic Scenes}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {2434--2444} }
ChameleonTuner: Automatic ISP Color Tuning in Subjective Scenarios-
[pdf]
[bibtex]@InProceedings{Tan_2026_WACV, author = {Tan, Zijie and Yue, Yuxin and Rashidi, Bahador}, title = {{ChameleonTuner}: Automatic {ISP} Color Tuning in Subjective Scenarios}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {297--307} }
UnderWater SLAM with Laser-light sectioning method using ST-GAT-
[pdf]
[supp]
[bibtex]@InProceedings{Gao_2026_WACV, author = {Gao, Heyang and Ichimaru, Kazuto and Iwaguchi, Takafumi and Kawasaki, Hiroshi}, title = {{UnderWater} {SLAM} with Laser-light sectioning method using {ST-GAT}}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {88--96} }
Non-Contact Blood Pressure Estimation from Face Videos via Physiology-Aware Contrastive Learning-
[pdf]
[bibtex]@InProceedings{Son_2026_WACV, author = {Son, JaeHyuk and Choi, Young-Seok}, title = {Non-Contact Blood Pressure Estimation from Face Videos via Physiology-Aware Contrastive Learning}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {2414--2423} }
Shift-Equivariant Complex-Valued Convolutional Neural Networks-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Gabot_2026_WACV, author = {Gabot, Quentin and Lim, Teck-Yian and Fix, Jeremy and Frontera-Pons, Joana and Ren, Chengfang and Ovarlez, Jean-Philippe}, title = {Shift-Equivariant Complex-Valued Convolutional Neural Networks}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {2575--2584} }
Explaining the Unseen: Multimodal Vision-Language Reasoning for Situational Awareness in Underground Mining Disasters-
[pdf]
[arXiv]
[bibtex]@InProceedings{Jewel_2026_WACV, author = {Jewel, Mizanur Rahman and Elmahallawy, Mohamed and Madria, Sanjay and Frimpong, Samuel}, title = {Explaining the Unseen: Multimodal Vision-Language Reasoning for Situational Awareness in Underground Mining Disasters}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {1324--1333} }
Zero-Shot Coreset Selection via Iterative Subspace Sampling-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Griffin_2026_WACV, author = {Griffin, Brent A. and Marks, Jacob and Corso, Jason J.}, title = {Zero-Shot Coreset Selection via Iterative Subspace Sampling}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {2114--2124} }
Test-Time Adaptation through Semantically-guided Feature Decomposition for Few-shot Chest X-ray Diagnosis-
[pdf]
[supp]
[bibtex]@InProceedings{Mahawar_2026_WACV, author = {Mahawar, Jayant and Paul, Angshuman}, title = {Test-Time Adaptation through Semantically-guided Feature Decomposition for Few-shot Chest {X-ray} Diagnosis}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {2445--2454} }
GenHSI: Controllable Generation of Human-Scene Interaction Videos-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2026_WACV, author = {Li, Zekun and Zhou, Rui and Sajnani, Rahul and Cong, Xiaoyan and Ritchie, Daniel and Sridhar, Srinath}, title = {{GenHSI}: Controllable Generation of Human-Scene Interaction Videos}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {138--149} }
Unified Video Anomaly Detection Model for Detecting Different Anomaly Types-
[pdf]
[supp]
[bibtex]@InProceedings{Lee_2026_WACV, author = {Lee, Kijung and Jo, Youngwan and Ahn, Sunghyun and Park, Sanghyun}, title = {Unified Video Anomaly Detection Model for Detecting Different Anomaly Types}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {784--794} }
M-ErasureBench: A Comprehensive Multimodal Evaluation Benchmark for Concept Erasure in Diffusion Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Weng_2026_WACV, author = {Weng, Ju-Hsuan and Liao, Jia-Wei and Chou, Cheng-Fu and Chen, Jun-Cheng}, title = {{M-ErasureBench}: A Comprehensive Multimodal Evaluation Benchmark for Concept Erasure in Diffusion Models}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {527--536} }
Leveraging Pretrained Representations for Cross-Modal Point Cloud Completion-
[pdf]
[supp]
[bibtex]@InProceedings{Kale_2026_WACV, author = {Kale, Kshitij and U, Hrishikesh and sreenidhe, V and S, Shylaja S}, title = {Leveraging Pretrained Representations for Cross-Modal Point Cloud Completion}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {97--105} }
Moire Zero: An Efficient and High-Performance Neural Architecture for Moire Removal-
[pdf]
[bibtex]@InProceedings{Lee_2026_WACV, author = {Lee, Seungryong and Baek, Woojeong and Kim, Younghyun and Kim, Eunwoo and Moon, Haru and Yoo, Donggon and Park, Eunbyung}, title = {{Moire Zero}: An Efficient and High-Performance Neural Architecture for Moire Removal}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {2520--2530} }
DermEVAL: A Dermatologist-Reviewed Benchmark for Multimodal Large Language Models-
[pdf]
[bibtex]@InProceedings{Zhao_2026_WACV, author = {Zhao, Hongjin and Li, Weihao and Qin, Zhenyue and Ji, Ge-Peng and Liu, Yang and Gedeon, Tom and Barnes, Nick}, title = {{DermEVAL}: A Dermatologist-Reviewed Benchmark for Multimodal Large Language Models}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {927--937} }
RAVU: Retrieval Augmented Video Understanding with Compositional Reasoning over Graph-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Malik_2026_WACV, author = {Malik, Sameer and Singh, Ayush and Yamada, Moyuru and Aggarwal, Dishank}, title = {{RAVU}: Retrieval Augmented Video Understanding with Compositional Reasoning over Graph}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {2869--2878} }
Low-Rank Expert Merging for Multi-Source Domain Adaptation in Person Re-Identification-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Nehdi_2026_WACV, author = {Nehdi, Taha Mustapha and Mrabah, Nairouz and Belal, Atif and Pedersoli, Marco and Granger, Eric}, title = {Low-Rank Expert Merging for Multi-Source Domain Adaptation in Person Re-Identification}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {1809--1819} }
BOP-Distrib: Revisiting 6D Pose Estimation Benchmarks for Better Evaluation under Visual Ambiguities-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Meden_2026_WACV, author = {Meden, Boris and Brazi, Asma and de Chamisso, Fabrice Mayran and Bourgeois, Steve and Lepetit, Vincent}, title = {{BOP-Distrib}: Revisiting {6D} Pose Estimation Benchmarks for Better Evaluation under Visual Ambiguities}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {1575--1585} }
DRWKV: Focusing on Object Edges for Low-Light Image Enhancement-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Bai_2026_WACV, author = {Bai, Xuecheng and Wang, Yuxiang and Hu, Boyu and Jie, Qinyuan and Xu, Chuanzhi and Li, Kechen and Xiao, Hongru and Chung, Vera}, title = {{DRWKV}: Focusing on Object Edges for Low-Light Image Enhancement}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {1554--1564} }
Intra-Class Probabilistic Embeddings for Uncertainty Estimation in Vision-Language Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lin_2026_WACV, author = {Lin, Zhenxiang and Haghighat, Maryam and Browne, Will and Miller, Dimity}, title = {Intra-Class Probabilistic Embeddings for Uncertainty Estimation in Vision-Language Models}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = mar, year = {2026}, pages = {2327--2337} }
ART: Actor-Related Tubelet for Detecting Complex-shaped Action Tubes-
[pdf]
[supp]
[bibtex]@InProceedings{Zhao_2026_WACV, author = {Zhao, Jiaojiao}, title = {ART: Actor-Related Tubelet for Detecting Complex-shaped Action Tubes}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {308-317} }
Cluster-Guided Adversarial Perturbations for Robust Contrastive Learning-
[pdf]
[supp]
[bibtex]@InProceedings{Seo_2026_WACV, author = {Seo, Seongyun and Han, Sungmin and Lee, Jeonghyun and Lee, Sangkyun}, title = {Cluster-Guided Adversarial Perturbations for Robust Contrastive Learning}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {350-359} }
IDEAL-M3D: Instance Diversity-Enriched Active Learning for Monocular 3D Detection-
[pdf]
[supp]
[bibtex]@InProceedings{Meier_2026_WACV, author = {Meier, Johannes and G{\"u}nther, Florian and Marin, Riccardo and Dhaouadi, Oussema and Kaiser, Jacques and Cremers, Daniel}, title = {IDEAL-M3D: Instance Diversity-Enriched Active Learning for Monocular 3D Detection}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {181-191} }
TaxonRL: Reinforcement Learning with Intermediate Rewards for Interpretable Fine-Grained Visual Reasoning-
[pdf]
[bibtex]@InProceedings{von_Klinski_2026_WACV, author = {von Klinski, Maximilian and Schall, Maximilian}, title = {TaxonRL: Reinforcement Learning with Intermediate Rewards for Interpretable Fine-Grained Visual Reasoning}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {2485-2498} }
Revisiting Retentive Networks for Fast Range-View 3D LiDAR Semantic Segmentation-
[pdf]
[supp]
[bibtex]@InProceedings{Mosco_2026_WACV, author = {Mosco, Simone and Fusaro, Daniel and Li, Wanmeng and Pretto, Alberto}, title = {Revisiting Retentive Networks for Fast Range-View 3D LiDAR Semantic Segmentation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {2499-2509} }
GraspDiffusion: Synthesizing Realistic Whole-body Hand-Object Interaction-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kwon_2026_WACV, author = {Kwon, Patrick and Chen, Chen and Joo, Hanbyul}, title = {GraspDiffusion: Synthesizing Realistic Whole-body Hand-Object Interaction}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {2392-2403} }
Understanding Human-Like Biases in VLMs via Subjective Face Analytics-
[pdf]
[supp]
[bibtex]@InProceedings{Roygaga_2026_WACV, author = {Roygaga, Chaitanya and Bharati, Aparna}, title = {Understanding Human-Like Biases in VLMs via Subjective Face Analytics}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {514-526} }
A Woman with a Knife or A Knife with a Woman? Measuring Directional Bias Amplification in Image Captions-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Nair_2026_WACV, author = {Nair, Rahul and Tokas, Bhanu and Kerner, Hannah}, title = {A Woman with a Knife or A Knife with a Woman? Measuring Directional Bias Amplification in Image Captions}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {255-264} }
Vision-informed Semantic Text Alignment for Open-set Recognition in Remote Sensing-
[pdf]
[supp]
[bibtex]@InProceedings{Gole_2026_WACV, author = {Gole, Siddhant and Pal, Akash and Jha, Ankit and Chaudhuri, Subhasis and Banerjee, Biplab}, title = {Vision-informed Semantic Text Alignment for Open-set Recognition in Remote Sensing}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {2828-2837} }
Referring Change Detection in Remote Sensing Imagery-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Korkmaz_2026_WACV, author = {Korkmaz, Yilmaz and Paranjape, Jay N. and de Melo, Celso M. and Patel, Vishal M.}, title = {Referring Change Detection in Remote Sensing Imagery}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {106-116} }
M4U: Evaluating Multilingual Understanding and Reasoning for Large Multimodal Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2026_WACV, author = {Wang, Hongyu and Xu, Jiayu and Xie, Senwei and Wang, Ruiping and Li, Jialin and Xie, Zhaojie and Zhang, Bin and Xiong, Chuyan and Chen, Xilin}, title = {M4U: Evaluating Multilingual Understanding and Reasoning for Large Multimodal Models}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {382-392} }
Snapmoji: Instant Generation of Animatable Dual-Stylized Avatars-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chen_2026_WACV, author = {Chen, Eric Ming and Liu, Di and Ma, Sizhuo and Vasilkovsky, Michael and Zhou, Bing and Gao, Qiang and Wang, Wenzhou and Luo, Jiahao and Metaxas, Dimitris N. and Sitzmann, Vincent and Wang, Jian}, title = {Snapmoji: Instant Generation of Animatable Dual-Stylized Avatars}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1948-1958} }
BanglaProtha: Evaluating Vision Language Models in Underrepresented Long-tail Cultural Contexts-
[pdf]
[supp]
[bibtex]@InProceedings{Fahim_2026_WACV, author = {Fahim, Md and Rahman, Md Sakib Ul and Rahman, Akm Moshiur and Ishmam, Md Farhan and Rahman, Md Tasmim and Shifat, Fariha Tanjim and Haider, Fabiha and Alam Bhuiyan, Md Farhad}, title = {BanglaProtha: Evaluating Vision Language Models in Underrepresented Long-tail Cultural Contexts}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1159-1169} }
CineVerse: Consistent Keyframe Synthesis for Cinematic Scene Composition-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Phung_2026_WACV, author = {Phung, Quynh and Mai, Long and Caba Heilbron, Fabian David and Liu, Feng and Huang, Jia-Bin and Ham, Cusuh}, title = {CineVerse: Consistent Keyframe Synthesis for Cinematic Scene Composition}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {2626-2636} }
MBTI: Metric-Based Textual Inversion for Fine-Grained Image Generation-
[pdf]
[supp]
[bibtex]@InProceedings{Chae_2026_WACV, author = {Chae, Byungkwan and Choi, Youngjae and Kim, Heewon}, title = {MBTI: Metric-Based Textual Inversion for Fine-Grained Image Generation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1106-1116} }
PRISM-CAFO: Prior-conditioned Remote-sensing Infrastructure Segmentation and Mapping for CAFOs-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Hoque_2026_WACV, author = {Hoque, Oishee Bintey and Mandal, Nibir Chandra and Luong, Kyle and Wilson, Amanda and Swarup, Samarth and Marathe, Madhav and Adiga, Abhijin}, title = {PRISM-CAFO: Prior-conditioned Remote-sensing Infrastructure Segmentation and Mapping for CAFOs}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {2083-2093} }
Gaussian Representations for Video-
[pdf]
[supp]
[bibtex]@InProceedings{Shah_2026_WACV, author = {Shah, Sachin and Choudhury, Anustup and Su, Guan-Ming and Pytlarz, Jaclyn and Metzler, Christopher A. and Mittal, Trisha}, title = {Gaussian Representations for Video}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {827-837} }
HyPCA-Net: Advancing Multimodal Fusion in Medical Image Analysis-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Dhar_2026_WACV, author = {Dhar, Joy and Pandey, Manish Kumar and Das Chakladar, Debashis and Haghighat, Maryam and Alavi, Azadeh and Mistry, Sajib and Zaidi, Nayyar}, title = {HyPCA-Net: Advancing Multimodal Fusion in Medical Image Analysis}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {1831-1840} }
No MoCap Needed: Post-Training Motion Diffusion Models with Reinforcement Learning using Only Textual Prompts-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Girolamo_2026_WACV, author = {Macaluso, Girolamo and Mandelli, Lorenzo and Bicchierai, Mirko and Berretti, Stefano and Bagdanov, Andrew D.}, title = {No MoCap Needed: Post-Training Motion Diffusion Models with Reinforcement Learning using Only Textual Prompts}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {967-976} }
Back
