Papers
- Back
ATM: Enhanced Alignment for Text-to-Motion Generation-
[pdf]
[supp]
[bibtex]@InProceedings{Han_2026_WACV,
    author    = {Han, Ke and Lyu, Yueming and Yu, Weichen and Sebe, Nicu},
    title     = {{ATM}: Enhanced Alignment for Text-to-Motion Generation},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {6862--6872}
}
GFT: Graph Feature Tuning for Efficient Point Cloud Analysis-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Dhakal_2026_WACV,
    author    = {Dhakal, Manish and Dasari, Venkat R and Sunderraman, Rajshekhar and Ding, Yi},
    title     = {{GFT}: Graph Feature Tuning for Efficient Point Cloud Analysis},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {7955--7964}
}
FG-TRACER: Tracing Information Flow in Multimodal Large Language Models in Free-Form Generation-
[pdf]
[supp]
[bibtex]@InProceedings{Saporita_2026_WACV,
    author    = {Saporita, Alessia and Pipoli, Vittorio and Bolelli, Federico and Baraldi, Lorenzo and Acquaviva, Andrea and Ficarra, Elisa},
    title     = {{FG-TRACER}: Tracing Information Flow in Multimodal Large Language Models in Free-Form Generation},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {7903--7912}
}
CAST: Evaluating Multi-Object Trackers with Context-Aware Switch and Transfer Scores-
[pdf]
[bibtex]@InProceedings{Bai_2026_WACV,
    author    = {Bai, Jin and Hager, Gregory D.},
    title     = {{CAST}: Evaluating Multi-Object Trackers with Context-Aware Switch and Transfer Scores},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {7260--7268}
}
NavMapFusion: Diffusion-based Fusion of Navigation Maps for Online Vectorized HD Map Construction-
[pdf]
[arXiv]
[bibtex]@InProceedings{Monninger_2026_WACV,
    author    = {Monninger, Thomas and Zhang, Zihan and Staab, Steffen and Ding, Sihao},
    title     = {{NavMapFusion}: Diffusion-based Fusion of Navigation Maps for Online Vectorized {HD} Map Construction},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {7945--7954}
}
DREAM: Dynamic Prompts and GuidedMix for Efficient Continual Adaptation of Visual-Language Models-
[pdf]
[bibtex]@InProceedings{Chee_2026_WACV,
    author    = {Chee, Evelyn and Lee, Mong Li and Hsu, Wynne},
    title     = {{DREAM}: Dynamic Prompts and {GuidedMix} for Efficient Continual Adaptation of Visual-Language Models},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {5853--5863}
}
Overcoming Small Data Limitations in Video-Based Infant Respiration Estimation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Song_2026_WACV,
    author    = {Song, Liyang and Bishnoi, Hardik and Manne, Sai Kumar Reddy and Ostadabbas, Sarah and Taylor, Briana J. and Wan, Michael},
    title     = {Overcoming Small Data Limitations in Video-Based Infant Respiration Estimation},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {6340--6349}
}
Distribution Highlighted Reference-based Label Distribution Learning for Facial Age Estimation-
[pdf]
[supp]
[bibtex]@InProceedings{Suzuki_2026_WACV,
    author    = {Suzuki, Satoshi and Yamaguchi, Shin'ya and Takeda, Shoichiro and Kaneko, Takuhiro and Orihashi, Shota and Masumura, Ryo},
    title     = {Distribution Highlighted Reference-based Label Distribution Learning for Facial Age Estimation},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {6464--6473}
}
IMKD: Intensity-Aware Multi-Level Knowledge Distillation for Camera-Radar Fusion-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Mishra_2026_WACV,
    author    = {Mishra, Shashank and Patil, Karan and Stricker, Didier and Rambach, Jason},
    title     = {{IMKD}: Intensity-Aware Multi-Level Knowledge Distillation for Camera-Radar Fusion},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {6027--6038}
}
Leveraging Semantic Attribute Binding for Free-Lunch Color Control in Diffusion Models-
[pdf]
[supp]
[bibtex]@InProceedings{Laria_2026_WACV,
    author    = {Laria, H{\'e}ctor and Gomez-Villa, Alexandra and Qin, Jiang and Butt, Muhammad Atif and Raducanu, Bogdan and Vazquez-Corral, Javier and van de Weijer, Joost and Wang, Kai},
    title     = {Leveraging Semantic Attribute Binding for Free-Lunch Color Control in Diffusion Models},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {7689--7698}
}
ForestSplats: Deformable Transient Field for Gaussian Splatting in the Wild-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Park_2026_WACV,
    author    = {Park, Wongi and Nam, Myeongseok and Kim, Siwon and Jo, Sangwoo and Lee, Soomok},
    title     = {{ForestSplats}: Deformable Transient Field for {Gaussian} Splatting in the Wild},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {6978--6987}
}
3D Cell Oversegmentation Correction via Geo-Wasserstein Divergence-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chen_2026_WACV,
    author    = {Chen, Peter and Chang, Bryan and Creasey, Olivia A. and Sneddon, Julie Beth and Gartner, Zev J. and Liu, Yining},
    title     = {{3D} Cell Oversegmentation Correction via {Geo-Wasserstein} Divergence},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {7534--7543}
}
STRinGS: Selective Text Refinement in Gaussian Splatting-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Raundhal_2026_WACV,
    author    = {Raundhal, Abhinav and Behera, Gaurav and Narayanan, P. J. and Sarvadevabhatla, Ravi Kiran and Tapaswi, Makarand},
    title     = {{STRinGS}: Selective Text Refinement in {Gaussian} Splatting},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {8574--8583}
}
SceneEdited: A City-Scale Benchmark for 3D HD Map Updating via Image-Guided Change Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lin_2026_WACV,
    author    = {Lin, Chun-Jung and Chin, Tat-Jun and Garg, Sourav and Dayoub, Feras},
    title     = {{SceneEdited}: A City-Scale Benchmark for {3D} {HD} Map Updating via Image-Guided Change Detection},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {6330--6339}
}
START: Spatial and Textual Learning for Chart Understanding-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liu_2026_WACV,
    author    = {Liu, Zhuoming and Gao, Xiaofeng and Niu, Feiyang and Gao, Qiaozi and Liu, Liu and Piramuthu, Robinson},
    title     = {{START}: Spatial and Textual Learning for Chart Understanding},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {8146--8156}
}
Adversarial Pseudo-replay for Exemplar-free Class-incremental Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Honda_2026_WACV,
    author    = {Honda, Hiroto},
    title     = {Adversarial Pseudo-replay for Exemplar-free Class-incremental Learning},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {7493--7502}
}
AugMapNet: Improving Spatial Latent Structure via BEV Grid Augmentation for Enhanced Vectorized Online HD Map Construction-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Monninger_2026_WACV_AugMapNet,
    author    = {Monninger, Thomas and Anwar, Md Zafar and Antol, Stanislaw and Staab, Steffen and Ding, Sihao},
    title     = {{AugMapNet}: Improving Spatial Latent Structure via {BEV} Grid Augmentation for Enhanced Vectorized Online {HD} Map Construction},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {8541--8550}
}
Mem-MLP: Real-Time 3D Human Motion Generation from Sparse Inputs-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Mutlu_2026_WACV,
    author    = {Mutlu, Sinan and Angelis, Georgios F. and Ozkan, Savas and Wisbey, Paul and Drosou, Anastasios and Ozay, Mete},
    title     = {{Mem-MLP}: Real-Time {3D} Human Motion Generation from Sparse Inputs},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {8343--8352}
}
SurgXBench: Explainable Vision-Language Model Benchmark for Surgery-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Cheng_2026_WACV,
    author    = {Cheng, Jiajun and Zhao, Xianwu and Liu, Sainan and Yu, Xiaofan and Prakash, Ravi and Codd, Patrick J. and Katz, Jonathan Elliott and Lin, Shan},
    title     = {{SurgXBench}: Explainable Vision-Language Model Benchmark for Surgery},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {8188--8198}
}
CanKD: Cross-Attention-based Non-local Operation for Feature-based Knowledge Distillation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Sun_2026_WACV,
    author    = {Sun, Shizhe and Ohyama, Wataru},
    title     = {{CanKD}: Cross-Attention-based Non-local Operation for Feature-based Knowledge Distillation},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {8606--8616}
}
UniTabBank: A Large Scale Multi-Lingual, Multi-Layout, Multi-Type, Multi-Format Dataset for Table Detection-
[pdf]
[supp]
[bibtex]@InProceedings{Mondal_2026_WACV,
    author    = {Mondal, Ajoy and Mundra, Saumya and Dasgupta, Avijit and Jawahar, C. V.},
    title     = {{UniTabBank}: A Large Scale Multi-Lingual, Multi-Layout, Multi-Type, Multi-Format Dataset for Table Detection},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {6486--6495}
}
Being Positive about Negative Queries: Exclusion Aware Multimodal Retrieval using Disentangled Representations-
[pdf]
[bibtex]@InProceedings{Jha_2026_WACV,
    author    = {Jha, Prachi and Bhatia, Sumit and Bedathur, Srikanta},
    title     = {Being Positive about Negative Queries: Exclusion Aware Multimodal Retrieval using Disentangled Representations},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {7832--7841}
}
CORA: Consistency-Guided Semi-Supervised Framework for Reasoning Segmentation-
[pdf]
[supp]
[bibtex]@InProceedings{Howlader_2026_WACV,
    author    = {Howlader, Prantik and Nguyen-Canh, Hoang and Das, Srijan and Xu, Jingyi and Le, Hieu and Samaras, Dimitris},
    title     = {{CORA}: Consistency-Guided Semi-Supervised Framework for Reasoning Segmentation},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {5934--5944}
}
Point2Pose: A Generative Framework for 3D Human Pose Estimation with Multi-View Point Cloud Dataset-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lee_2026_WACV,
    author    = {Lee, Hyunsoo and Jeon, Daeum and Oh, Hyeokjae},
    title     = {{Point2Pose}: A Generative Framework for {3D} Human Pose Estimation with Multi-View Point Cloud Dataset},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {6744--6753}
}
GDoFS: Gaussian DoF Separation for Plausible 3D Geometry in Sparse-View 3DGS-
[pdf]
[supp]
[bibtex]@InProceedings{Kim_2026_WACV,
    author    = {Kim, Yongsung and Choi, Jooyoung and Yoon, Sungroh},
    title     = {{GDoFS}: {Gaussian} {DoF} Separation for Plausible {3D} Geometry in Sparse-View {3DGS}},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {6643--6652}
}
Distilling Offline Action Detection Models into Real-Time Streaming Models-
[pdf]
[bibtex]@InProceedings{Patel_2026_WACV,
    author    = {Patel, Deep and Babazaki, Yasunori and Nagase, Yasuto and Melvin, Iain and Min, Martin Renqiang},
    title     = {Distilling Offline Action Detection Models into Real-Time Streaming Models},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {6205--6214}
}
Remote Sensing Forestry Similarity Convolution-
[pdf]
[bibtex]@InProceedings{Wang_2026_WACV,
    author    = {Wang, Shikuan and Chen, Yuangong and Gong, Jianzhou and Meng, Lingyi and Wu, Mengquan and Liu, Longxing and Yuan, Haiwei and Guo, Mingbin},
    title     = {Remote Sensing Forestry Similarity Convolution},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {7565--7575}
}
Multimodal Graph Representation Learning over Arbitrary Sets of Modalities-
[pdf]
[supp]
[bibtex]@InProceedings{Patapati_2026_WACV,
    author    = {Patapati, Santosh and Srinivasan, Trisanth},
    title     = {Multimodal Graph Representation Learning over Arbitrary Sets of Modalities},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {7104--7115}
}
Uncertainty-Aware Vision-Language Segmentation for Medical Imaging-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Das_2026_WACV,
    author    = {Das, Aryan and Rachamalla, Tanishq and Biswas, Koushik and Roy, Swalpa Kumar and Verma, Vinay Kumar},
    title     = {Uncertainty-Aware Vision-Language Segmentation for Medical Imaging},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {8490--8499}
}
SeqFeedNet: Sequential Feature Feedback Network for Background Subtraction-
[pdf]
[supp]
[bibtex]@InProceedings{Huang_2026_WACV,
    author    = {Huang, Yu-Shun and Guo, Jing-Ming and Yang, Yi-Xiang},
    title     = {{SeqFeedNet}: Sequential Feature Feedback Network for Background Subtraction},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {8199--8208}
}
Crash2DocAI: Automated Integration of Post-Crash Car Part Images into Technical Reports-
[pdf]
[bibtex]@InProceedings{Divis_2026_WACV,
    author    = {Divis, Vaclav and Giovagnola, Jessica and Ben Chikha, Khalil and Hr{\'u}z, Marek},
    title     = {{Crash2DocAI}: Automated Integration of Post-Crash Car Part Images into Technical Reports},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {8272--8281}
}
From Prompt to Production: Automating Brand-Safe Marketing Imagery with Text-to-Image Models-
[pdf]
[supp]
[bibtex]@InProceedings{Atighehchian_2026_WACV,
    author    = {Atighehchian, Parmida and Wang, Henry and Kapustin, Andrei and Lerner, Boris and Jiang, Tiancheng and Jensen, Taylor and Sokhandan, Negin},
    title     = {From Prompt to Production: Automating Brand-Safe Marketing Imagery with Text-to-Image Models},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {6818--6826}
}
MaxInfo: A Training-Free Key-Frame Selection Method Using Maximum Volume for Enhanced Video Understanding-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2026_WACV,
    author    = {Li, Pengyi and Abdullaeva, Irina and Gambashidze, Alexander and Kuznetsov, Andrey and Oseledets, Ivan},
    title     = {{MaxInfo}: A Training-Free Key-Frame Selection Method Using Maximum Volume for Enhanced Video Understanding},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {7198--7207}
}
SDT-6D: Fully Sparse Depth-Transformer for Staged End-to-End 6D Pose Estimation in Industrial Multi-View Bin Picking-
[pdf]
[bibtex]@InProceedings{Leuze_2026_WACV,
    author    = {Leuze, Nico and Hoh, Maximilian and Do{\u{g}}an, Samed and R.-Pe{\~n}a, Nicolas and Schoettl, Alfred},
    title     = {{SDT-6D}: Fully Sparse Depth-Transformer for Staged End-to-End {6D} Pose Estimation in Industrial Multi-View Bin Picking},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {8406--8415}
}
VideoSketcher: A Training-Free Approach for Coherent Video Sketch Transfer-
[pdf]
[supp]
[bibtex]@InProceedings{Li_2026_WACV_VideoSketcher,
    author    = {Li, Huining and Liu, Bangzhen and Yang, Rui and Zhou, Yang and Xu, Chenshu and Pang, Xufang and He, Shengfeng},
    title     = {{VideoSketcher}: A Training-Free Approach for Coherent Video Sketch Transfer},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {7333--7343}
}
From Darkness to Detail: Frequency-Aware SSMs for Low-Light Vision-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Adhikarla_2026_WACV,
    author    = {Adhikarla, Eashan and Zhang, Kai and Chen, Gong and Nicholson, John and Davison, Brian D.},
    title     = {From Darkness to Detail: Frequency-Aware {SSMs} for Low-Light Vision},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {6956--6967}
}
Mean-Shift Distillation for Diffusion Mode Seeking-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Thamizharasan_2026_WACV,
    author    = {Thamizharasan, Vikas and Chatzis, Nikitas and Georgiev, Iliyan and Fisher, Matthew and Kalogerakis, Evangelos and Liu, Difan and Zhao, Nanxuan and Luk{\'a}{\v{c}}, Michal},
    title     = {Mean-Shift Distillation for Diffusion Mode Seeking},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {6537--6546}
}
ISALux: Illumination and Semantics-Aware Transformer Employing Mixture of Experts for Low Light Image Enhancement-
[pdf]
[supp]
[bibtex]@InProceedings{Balmez_2026_WACV,
    author    = {Balmez, Raul and Brateanu, Alexandru and Orhei, Ciprian and Ancuti, Codruta O. and Ancuti, Cosmin},
    title     = {{ISALux}: Illumination and Semantics-Aware Transformer Employing Mixture of Experts for Low Light Image Enhancement},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {7862--7872}
}
SVS-GAN for Semantic Synthesis of Traffic Videos for Autonomous Driving-
[pdf]
[supp]
[bibtex]@InProceedings{Seyam_2026_WACV,
    author    = {Seyam, Khaled M. and Wiederer, Julian and Braun, Markus and Yang, Bin},
    title     = {{SVS-GAN} for Semantic Synthesis of Traffic Videos for Autonomous Driving},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {8650--8659}
}
Memoire: Learning User Personas from Gallery Tags for Personalized Photo Curation-
[pdf]
[supp]
[bibtex]@InProceedings{Mathur_2026_WACV,
    author    = {Mathur, Praful and Iftekhar, Mohsin and Sharma, Aman and Tiwari, Sarvesh and Deka, Meghali and Cherukuri, Sathish and Sheshadri, K Roopa and Valusa, Rakesh},
    title     = {Memoire: Learning User Personas from Gallery Tags for Personalized Photo Curation},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {6873--6882}
}
Boosting Unsupervised Video Instance Segmentation with Automatic Quality-Guided Self-Training-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lu_2026_WACV,
    author    = {Lu, Kaixuan and Kaya, Mehmet Onurcan and Papadopoulos, Dim P.},
    title     = {Boosting Unsupervised Video Instance Segmentation with Automatic Quality-Guided Self-Training},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {7387--7397}
}
Test Time Adaptation Using Adaptive Quantile Recalibration-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Mehrbod_2026_WACV,
    author    = {Mehrbod, Paria and Vianna, Pedro and Nanfack, Geraldin and Wolf, Guy and Belilovsky, Eugene},
    title     = {Test Time Adaptation Using Adaptive Quantile Recalibration},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {5986--5995}
}
SceneEval: Evaluating Semantic Coherence in Text-Conditioned 3D Indoor Scene Synthesis-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Tam_2026_WACV,
    author    = {Tam, Hou In Ivan and Pun, Hou In Derek and Wang, Austin T. and Chang, Angel X. and Savva, Manolis},
    title     = {{SceneEval}: Evaluating Semantic Coherence in Text-Conditioned {3D} Indoor Scene Synthesis},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {7355--7365}
}
Rethinking Latent Variable in Learned Image Compression-
[pdf]
[supp]
[bibtex]@InProceedings{Yi_2026_WACV,
    author    = {Yi, Fangzhou and Gong, Zhicheng and Zeng, Hui},
    title     = {Rethinking Latent Variable in Learned Image Compression},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {8531--8540}
}
MUSE: Model-based Uncertainty-aware Similarity Estimation for zero-shot 2D Object Detection and Segmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Cho_2026_WACV,
    author    = {Cho, Sungmin and Park, Sungbum and Oh, Insoo},
    title     = {{MUSE}: Model-based Uncertainty-aware Similarity Estimation for zero-shot {2D} Object Detection and Segmentation},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {6090--6100}
}
Modeling and Learning Multiple Hypotheses for Monocular 3D Object Detection-
[pdf]
[supp]
[bibtex]@InProceedings{Park_2026_WACV_MultipleHypotheses,
    author    = {Park, Hyeonjeong and Xiong, Peixi and Yu, Pei and Tang, Wei},
    title     = {Modeling and Learning Multiple Hypotheses for Monocular {3D} Object Detection},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {7040--7050}
}
SD-CSFL: A Synthetic Data-Driven Conformity Scoring Framework for Robust Federated Learning-
[pdf]
[supp]
[bibtex]@InProceedings{Alharbi_2026_WACV,
    author    = {Alharbi, Ebtisaam and Kerim, Abdulrahman and Marcolino, Leandro Soriano and Ni, Qiang},
    title     = {{SD-CSFL}: A Synthetic Data-Driven Conformity Scoring Framework for Robust Federated Learning},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {6903--6912}
}
MedROV: Towards Real-Time Open-Vocabulary Detection Across Diverse Medical Imaging Modalities-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Sheikh_2026_WACV,
    author    = {Sheikh, Tooba Tehreem and Lahoud, Jean and Anwer, Rao Muhammad and Khan, Fahad Shahbaz and Khan, Salman and Cholakkal, Hisham},
    title     = {{MedROV}: Towards Real-Time Open-Vocabulary Detection Across Diverse Medical Imaging Modalities},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {8628--8638}
}
Towards Unconstrained Cross-View Pose Estimation-
[pdf]
[supp]
[bibtex]@InProceedings{Wollam_2026_WACV,
    author    = {Wollam, Alexander and Ashley, Kyle and Shugaev, Maxim and Arend, Oliver and Semenov, Ilya and Dashtestani, Hadis and Ravi, Sumved and Jacobs, Nathan},
    title     = {Towards Unconstrained Cross-View Pose Estimation},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {8448--8457}
}
FocalComm: Hard Instance-Aware Multi-Agent Perception-
[pdf]
[arXiv]
[bibtex]@InProceedings{Shenkut_2026_WACV,
    author    = {Shenkut, Dereje and Bhagavatula, Vijayakumar},
    title     = {{FocalComm}: Hard Instance-Aware Multi-Agent Perception},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {6277--6286}
}
Video and Language Alignment in 2D Systems for 3D Multi-object Scenes with Multi-Information Derivative-Free Control-
[pdf]
[supp]
[bibtex]@InProceedings{Armitage_2026_WACV,
    author    = {Armitage, Jason and Sennrich, Rico},
    title     = {Video and Language Alignment in {2D} Systems for {3D} Multi-object Scenes with Multi-Information Derivative-Free Control},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {6266--6276}
}
GaussianHeadTalk: Wobble-Free 3D Talking Heads with Audio Driven Gaussian Splatting-
[pdf]
[supp]
[bibtex]@InProceedings{Agarwal_2026_WACV,
    author    = {Agarwal, Madhav and Zhang, Mingtian and Sevilla-Lara, Laura and McDonagh, Steven},
    title     = {{GaussianHeadTalk}: Wobble-Free {3D} Talking Heads with Audio Driven {Gaussian} Splatting},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {8017--8027}
}
SVD-Det: A Lightweight Framework for Video Forgery Detection Using Semantic and Visual Defect Cues-
[pdf]
[supp]
[bibtex]@InProceedings{Yang_2026_WACV,
    author    = {Yang, Tsung-Shan and Zhang, Tianyu and Qian, Feng and Yan, Bing and Kuo, C.-C. Jay},
    title     = {{SVD-Det}: A Lightweight Framework for Video Forgery Detection Using Semantic and Visual Defect Cues},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {7616--7625}
}
FastHMR: Accelerating Human Mesh Recovery via Token and Layer Merging with Diffusion Decoding-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Mehraban_2026_WACV,
    author    = {Mehraban, Soroush and Iaboni, Andrea and Taati, Babak},
    title     = {{FastHMR}: Accelerating Human Mesh Recovery via Token and Layer Merging with Diffusion Decoding},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {6733--6743}
}
See, Think, Learn: A Self-Taught Multimodal Reasoner-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Sharma_2026_WACV,
    author    = {Sharma, Sourabh and Gupta, Sonam and Sadbhawna, Sadbhawna},
    title     = {See, Think, Learn: A Self-Taught Multimodal Reasoner},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {8313--8322}
}
CSF-Net: Context-Semantic Fusion Network for Large Mask Inpainting-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Heo_2026_WACV,
    author    = {Heo, Chae-Yeon and Cho, Yeong-Jun},
    title     = {{CSF-Net}: Context-Semantic Fusion Network for Large Mask Inpainting},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {8292--8301}
}
Virtually Unrolling the Herculaneum Papyri by Diffeomorphic Spiral Fitting-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Henderson_2026_WACV,
    author    = {Henderson, Paul},
    title     = {Virtually Unrolling the {Herculaneum} Papyri by Diffeomorphic Spiral Fitting},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {6401--6411}
}
Exploring the Boundaries of Diffusion Models for Offline Writer Identification with Sparse and Intra-Variable Data-
[pdf]
[supp]
[bibtex]@InProceedings{Dey_2026_WACV,
    author    = {Dey, Aritra and Adak, Chandranath and Priya, Kumari and Chattopadhyay, Soumi and Chanda, Sukalpa},
    title     = {Exploring the Boundaries of Diffusion Models for Offline Writer Identification with Sparse and Intra-Variable Data},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {7178--7187}
}
Hierarchical Instance Tracking to Balance Privacy Preservation with Accessible Information-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Prasad_2026_WACV,
    author    = {Prasad, Neelima and Reynolds, Jarek and Karsanbhai, Neel and Sharma, Tanusree and Zhang, Lotus and Stangl, Abigale and Wang, Yang and Findlater, Leah and Gurari, Danna},
    title     = {Hierarchical Instance Tracking to Balance Privacy Preservation with Accessible Information},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {5945--5955}
}
Photo Dating by Facial Age Aggregation-
[pdf]
[supp]
[bibtex]@InProceedings{Paplham_2026_WACV,
    author    = {Paplh{\'a}m, Jakub and Franc, Vojt{\v{e}}ch},
    title     = {Photo Dating by Facial Age Aggregation},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {8103--8112}
}
Test-Time Consistency in Vision Language Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chou_2026_WACV,
    author    = {Chou, Shih-Han and Chandhok, Shivam and Little, James J. and Sigal, Leonid},
    title     = {Test-Time Consistency in Vision Language Models},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {7789--7798}
}
CSGaussian: Progressive Rate-Distortion Compression and Segmentation for 3D Gaussian Splatting-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Tseng_2026_WACV,
    author    = {Tseng, Yu-Jen and Kao, Chia-Hao and Chen, Jing-Zhong and Gnutti, Alessandro and Lo, Shao-Yuan and Lin, Yen-Yu and Peng, Wen-Hsiao},
    title     = {{CSGaussian}: Progressive Rate-Distortion Compression and Segmentation for {3D} {Gaussian} Splatting},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {6883--6892}
}
Conversational Image Generation: Towards Multi-Round Personalized Generation with Multi-Modal Language Models-
[pdf]
[supp]
[bibtex]@InProceedings{Zhang_2026_WACV,
    author    = {Zhang, Haochen and Sinha, Animesh and Juefei-Xu, Felix and Ma, Haoyu and Li, Kunpeng and Fan, Zhipeng and Dai, Xiaoliang and Hou, Tingbo and Zhang, Peizhao and He, Zecheng},
    title     = {Conversational Image Generation: Towards Multi-Round Personalized Generation with Multi-Modal Language Models},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {8282--8291}
}
PhyEduVideo: A Benchmark for Evaluating Text-to-Video Models for Physics Education-
[pdf]
[supp]
[bibtex]@InProceedings{K.M_2026_WACV,
    author    = {K.M, Megha Mariam and Arun, Aditya and Laskar, Zakaria and Jawahar, C. V.},
    title     = {{PhyEduVideo}: A Benchmark for Evaluating Text-to-Video Models for Physics Education},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {8690--8699}
}
PEaRL: Pathway-Enhanced Representation Learning for Gene and Pathway Expression Prediction from Histology-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Majumder_2026_WACV,
    author    = {Majumder, Sejuti and Kapse, Saarthak and Bhattacharya, Moinak and Xu, Xuan and Yurovsky, Alisa and Prasanna, Prateek},
    title     = {{PEaRL}: Pathway-Enhanced Representation Learning for Gene and Pathway Expression Prediction from Histology},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {8052--8062}
}
FastPose-ViT: A Vision Transformer for Real-Time Spacecraft Pose Estimation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ancey_2026_WACV,
    author    = {Ancey, Pierre and Price, Andrew and Javed, Saqib and Salzmann, Mathieu},
    title     = {{FastPose-ViT}: A Vision Transformer for Real-Time Spacecraft Pose Estimation},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {7873--7882}
}
Improvise, Adapt, Overcome -- Telescopic Adapters for Efficient Fine-tuning of Vision Language Models in Medical Imaging-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Mishra_2026_WACV, author = {Mishra, Ujjwal and Shukla, Vinita and Hambarde, Praful and Shukla, Amit}, title = {Improvise, Adapt, Overcome -- Telescopic Adapters for Efficient Fine-tuning of Vision Language Models in Medical Imaging}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7605-7615} }
Zero-LEAD: Source-Free Universal Domain Adaptation for Abdominal Multi-Organ Segmentation-
[pdf]
[bibtex]@InProceedings{El-Sayed_2026_WACV, author = {El-Sayed, Ahmed and Torki, Marwan}, title = {Zero-LEAD: Source-Free Universal Domain Adaptation for Abdominal Multi-Organ Segmentation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6715-6723} }
Dual-Domain Multimodal Hyperbolic Fusion for Cardiopulmonary Disease Diagnosis in Emergency Care-
[pdf]
[bibtex]@InProceedings{Nan_2026_WACV, author = {Nan, Ke and Samaan, Maggie and Burns, Benjamin and Ning, Xia and Han, Yuchi and Xue, Yuan}, title = {Dual-Domain Multimodal Hyperbolic Fusion for Cardiopulmonary Disease Diagnosis in Emergency Care}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {8700-8710} }
Procedure Learning via Regularized Gromov-Wasserstein Optimal Transport-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Mahmood_2026_WACV, author = {Mahmood, Syed Ahmed and Ali, Ali Shah and Ahmed, Umer and Fateh, Fawad Javed and Zia, M. Zeeshan and Tran, Quoc-Huy}, title = {Procedure Learning via Regularized Gromov-Wasserstein Optimal Transport}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6925-6935} }
PDV: Prompt Directional Vectors for Zero-shot Composed Image Retrieval-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Tursun_2026_WACV, author = {Tursun, Osman and Kalkan, Sinan and Denman, Simon and Fookes, Clinton}, title = {PDV: Prompt Directional Vectors for Zero-shot Composed Image Retrieval}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7740-7749} }
Any Detector Can Detect Anything-
[pdf]
[supp]
[bibtex]@InProceedings{Huang_2026_WACV, author = {Huang, Thomas E. and Li, Siyuan and Danelljan, Martin and Ding, Henghui and Van Gool, Luc and Yu, Fisher}, title = {Any Detector Can Detect Anything}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {8437-8447} }
Automated Suturing Skill Assessment in Robot-assisted Surgery from Endoscopic Videos using Clinically-guided Evaluation Criteria-
[pdf]
[bibtex]@InProceedings{Deo_2026_WACV, author = {Deo, Atharva Sunil and Pasupulety, Ujjwal and Matsumoto, Nicholas and Moran, Jay and Yang, Cherine and Kim, Jeanine and Kocielnik, Rafal Dariusz and Naser-Tavakolian, Aurash and Hung, Andrew}, title = {Automated Suturing Skill Assessment in Robot-assisted Surgery from Endoscopic Videos using Clinically-guided Evaluation Criteria}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7218-7228} }
Polymorph: Energy-Efficient Multi-Label Classification for Video Streams on Embedded Devices-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ghafouri_2026_WACV, author = {Ghafouri, Saeid and Fayyaz, Mohsen and Li, Xiangchen and John, Deepu and Ji, Bo and Nikolopoulos, Dimitrios S. and Vandierendonck, Hans}, title = {Polymorph: Energy-Efficient Multi-Label Classification for Video Streams on Embedded Devices}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6432-6441} }
VectorSynth: Fine-Grained Satellite Image Synthesis with Structured Semantics-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Cher_2026_WACV, author = {Cher, Daniel and Wei, Brian and Sastry, Srikumar and Jacobs, Nathan}, title = {VectorSynth: Fine-Grained Satellite Image Synthesis with Structured Semantics}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7019-7029} }
DiffRegCD: Integrated Registration and Change Detection with Diffusion Features-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Madani_2026_WACV, author = {Madani, Seyedehanita and Chellappa, Rama and Patel, Vishal M.}, title = {DiffRegCD: Integrated Registration and Change Detection with Diffusion Features}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7503-7512} }
LangPose: Language-Aligned Motion for Robust 3D Human Pose Estimation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liao_2026_WACV, author = {Liao, Longyun and Zheng, Rong}, title = {LangPose: Language-Aligned Motion for Robust 3D Human Pose Estimation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {8073-8083} }
CLIP-UP: CLIP-Based Unanswerable Problem Detection for Visual Question Answering-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Vardi_2026_WACV, author = {Vardi, Ben and Nir, Oron and Shamir, Ariel}, title = {CLIP-UP: CLIP-Based Unanswerable Problem Detection for Visual Question Answering}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {5898-5908} }
Beyond Paired Data: Self-Supervised UAV Geo-Localization from Reference Imagery Alone-
[pdf]
[supp]
[bibtex]@InProceedings{Amadei_2026_WACV, author = {Amadei, Tristan and Meinhardt-Llopis, Enric and Bascle, Benedicte and Abgrall, Corentin and Facciolo, Gabriele}, title = {Beyond Paired Data: Self-Supervised UAV Geo-Localization from Reference Imagery Alone}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7409-7419} }
Training-Free Few-Shot Segmentation via Vision-Language Guided Prompting-
[pdf]
[bibtex]@InProceedings{Yoon_2026_WACV, author = {Yoon, Euihyun and Park, Taejin and Lee, Jaekoo}, title = {Training-Free Few-Shot Segmentation via Vision-Language Guided Prompting}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6517-6526} }
HDR Reconstruction Boosting with Training-Free and Exposure-Consistent Diffusion-
[pdf]
[supp]
[bibtex]@InProceedings{Lin_2026_WACV, author = {Lin, Yo-Tin and Chen, Su-Kai and Hu, Hou-Ning and Lin, Yen-Yu and Liu, Yu-Lun}, title = {HDR Reconstruction Boosting with Training-Free and Exposure-Consistent Diffusion}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7513-7523} }
Exploring Automated Recognition of Instructional Activity and Discourse from Multimodal Classroom Data-
[pdf]
[supp]
[bibtex]@InProceedings{Bueno_2026_WACV, author = {Bueno, Ivo and Hou, Ruikun and B\"uhler, Babette and F\"utterer, Tim and Drimalla, James and Foster, Jonathan K. and Youngs, Peter and Gerjets, Peter and Trautwein, Ulrich and Kasneci, Enkelejda}, title = {Exploring Automated Recognition of Instructional Activity and Discourse from Multimodal Classroom Data}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6806-6817} }
SCAdapter: Content-Style Disentanglement for Diffusion Style Transfer-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Trinh_2026_WACV, author = {Trinh, Luan Thanh}, title = {SCAdapter: Content-Style Disentanglement for Diffusion Style Transfer}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7312-7321} }
Equivariant Sampling for Improving Diffusion Model-based Image Restoration-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wu_2026_WACV, author = {Wu, Chenxu and Kong, Qingpeng and Zhao, Peiang and Yang, Wendi and Ma, Wenxin and Tang, Fenghe and Jiang, Zihang and Zhou, S.Kevin}, title = {Equivariant Sampling for Improving Diffusion Model-based Image Restoration}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6827-6839} }
AuViRe: Audio-visual Speech Representation Reconstruction for Deepfake Temporal Localization-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Koutlis_2026_WACV, author = {Koutlis, Christos and Papadopoulos, Symeon}, title = {AuViRe: Audio-visual Speech Representation Reconstruction for Deepfake Temporal Localization}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7168-7177} }
Predicting Task fMRI Contrasts from Resting-State fMRI Using Sparse 3D Convolutions-
[pdf]
[bibtex]@InProceedings{Sviridov_2026_WACV, author = {Sviridov, Ivan and Boyko, Maria and Sharaev, Maksim}, title = {Predicting Task fMRI Contrasts from Resting-State fMRI Using Sparse 3D Convolutions}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6320-6329} }
Causality-Driven Audits of Model Robustness-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Drenkow_2026_WACV, author = {Drenkow, Nathan and Paul, William and Ribaudo, Chris and Unberath, Mathias}, title = {Causality-Driven Audits of Model Robustness}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {5956-5966} }
Pointmap-Conditioned Diffusion for Consistent Novel View Synthesis-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Nguyen_2026_WACV, author = {Nguyen, Thang-Anh-Quan and Caraffa, Laurent and Tarel, Jean-Philippe and Br\'emond, Roland}, title = {Pointmap-Conditioned Diffusion for Consistent Novel View Synthesis}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6360-6370} }
Reciprocal Teaching: Dynamic Multi-Model Teacher-Student Learning for Multiple Noisy Annotations-
[pdf]
[supp]
[bibtex]@InProceedings{Ai_2026_WACV, author = {Ai, Wenjie and Nguyen, Cuong C. and Hilton, Adrian and Carneiro, Gustavo}, title = {Reciprocal Teaching: Dynamic Multi-Model Teacher-Student Learning for Multiple Noisy Annotations}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {8376-8385} }
RampWatch: An In-the-Wild Dataset and Text-Guided Detection Framework for Recreational Vessels-
[pdf]
[supp]
[bibtex]@InProceedings{Asim_2026_WACV, author = {Asim, Malik Muhammad and Smallwood, Claire B. and Tariq, Abdullah and Lo, Johnny and Gilani, Syed Zulqarnain}, title = {RampWatch: An In-the-Wild Dataset and Text-Guided Detection Framework for Recreational Vessels}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7576-7585} }
Q-Former Autoencoder: A Modern Framework for Medical Anomaly Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Dalmonte_2026_WACV, author = {Dalmonte, Francesco and Bayar, Emirhan and Akbas, Emre and Georgescu, Mariana-Iuliana}, title = {Q-Former Autoencoder: A Modern Framework for Medical Anomaly Detection}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7985-7995} }
MoSCo: Real-time and Efficient Text-to-Motion Synthesis via Delta Training-
[pdf]
[bibtex]@InProceedings{Zhang_2026_WACV, author = {Zhang, Zhiyuan and Liu, Lingqiao}, title = {MoSCo: Real-time and Efficient Text-to-Motion Synthesis via Delta Training}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6298-6308} }
Splannequin: Freezing Monocular Mannequin-Challenge Footage with Dual-Detection Splatting-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chien_2026_WACV, author = {Chien, Hao-Jen and Huang, Yi-Chuan and Wu, Chung-Ho and Chao, Wei-Lun and Liu, Yu-Lun}, title = {Splannequin: Freezing Monocular Mannequin-Challenge Footage with Dual-Detection Splatting}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {8028-8040} }
Hybrid State Representation for Video Procedure Planning-
[pdf]
[supp]
[bibtex]@InProceedings{Choi_2026_WACV, author = {Choi, Woo Suk and Jang, Youwon and Lee, Minsu and Zhang, Byoung-Tak}, title = {Hybrid State Representation for Video Procedure Planning}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6507-6516} }
Diagnose Like A REAL Pathologist: An Uncertainty-Focused Approach for Trustworthy Multi-Resolution Multiple Instance Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Hong_2026_WACV, author = {Hong, Sungrae and Lee, Sol and Shin, Jisu and Jeong, Jiwon and Yi, Mun Yong}, title = {Diagnose Like A REAL Pathologist: An Uncertainty-Focused Approach for Trustworthy Multi-Resolution Multiple Instance Learning}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6132-6141} }
Align Video Diffusion Model with Online Video-Centric Preference Optimization-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhang_2026_WACV, author = {Zhang, Jiacheng and Wu, Jie and Chen, Weifeng and Ji, Yatai and Xiao, Xuefeng and Huang, Weilin and Han, Kai}, title = {Align Video Diffusion Model with Online Video-Centric Preference Optimization}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6142-6152} }
AortaDiff: A Unified Multitask Diffusion Framework for Contrast-Free AAA Imaging-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ou_2026_WACV, author = {Ou, Yuxuan and Bi, Ning and Pan, Jiazhen and Yang, Jiancheng and Yu, Boliang and Zidan, Usama and Lee, Regent and Grau, Vicente}, title = {AortaDiff: A Unified Multitask Diffusion Framework for Contrast-Free AAA Imaging}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {8242-8251} }
High-Level Semantics and Low-Level Features Fusion for Multi-Scale Object Detection in Dynamic Construction Environments-
[pdf]
[bibtex]@InProceedings{Bonyani_2026_WACV, author = {Bonyani, Mahdi and Soleymani, Maryam and Wang, Chao}, title = {High-Level Semantics and Low-Level Features Fusion for Multi-Scale Object Detection in Dynamic Construction Environments}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6527-6536} }
AusSmoke meets MultiNatSmoke: a fully-labelled diverse smoke segmentation dataset-
[pdf]
[bibtex]@InProceedings{Li_2026_WACV, author = {Li, Weihao and Zhao, Hongjin and Zhu, Gao and Ji, Ge-Peng and Wilson, Nicholas and Yebra, Marta and Barnes, Nick}, title = {AusSmoke meets MultiNatSmoke: a fully-labelled diverse smoke segmentation dataset}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7996-8006} }
MVAT: Multi-View Aware Teacher for Weakly Supervised 3D Object Detection-
[pdf]
[supp]
[bibtex]@InProceedings{Lahlali_2026_WACV, author = {Lahlali, Saad and Fournier-Mongieux, Alexandre and Granger, Nicolas and Le Borgne, Herv\'e and Pham, Quoc-Cuong}, title = {MVAT: Multi-View Aware Teacher for Weakly Supervised 3D Object Detection}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6101-6110} }
DreamCatcher: Efficient Multi-Concept Customization via Representation Finetuning-
[pdf]
[supp]
[bibtex]@InProceedings{Lee_2026_WACV, author = {Lee, Jungwon and Lee, Changhun and Park, Eunhyeok}, title = {DreamCatcher: Efficient Multi-Concept Customization via Representation Finetuning}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7062-7072} }
GorillaWatch: An Automated System for In-the-Wild Gorilla Re-Identification and Population Monitoring-
[pdf]
[bibtex]@InProceedings{Schall_2026_WACV, author = {Schall, Maximilian and Kn\"ofel, Felix Leonard and K\"onig, Noah Elias and Kubeler, Jan Jonas and von Klinski, Maximilian and Linnemann, Joan Wilhelm and Liu, Xiaoshi and Schlegelmilch, Iven Jelle and Woyciniuk, Ole and Schild, Alexandra and Wasmuht, Dante and Espinet, Magdalena Bermejo and Basas, German Illera and de Melo, Gerard}, title = {GorillaWatch: An Automated System for In-the-Wild Gorilla Re-Identification and Population Monitoring}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {8364-8375} }
CLoCKDistill: Consistent Location and Context aware Knowledge Distillation for DETRs-
[pdf]
[arXiv]
[bibtex]@InProceedings{Lan_2026_WACV, author = {Lan, Qizhen and Tian, Qing}, title = {CLoCKDistill: Consistent Location and Context aware Knowledge Distillation for DETRs}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7188-7197} }
NAPP: Noise-Adaptive Prototype Perturbation for Few-Shot Learning-
[pdf]
[bibtex]@InProceedings{Kim_2026_WACV, author = {Kim, Ilhwan and Yun, Sangwoo and Lee, Dongheon and Kim, Seongsu and Paik, Joonki}, title = {NAPP: Noise-Adaptive Prototype Perturbation for Few-Shot Learning}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {8007-8016} }
MemeTAG: Keyword-Driven Meme Classification through Tag Embedding Reconstruction-
[pdf]
[supp]
[bibtex]@InProceedings{Sharma_2026_WACV, author = {Sharma, Akshit and Patil, Prashant W}, title = {MemeTAG: Keyword-Driven Meme Classification through Tag Embedding Reconstruction}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7679-7688} }
Hymavi : A Hybrid Mamba-Attention Network in Multi-View Framework for Volumetric Medical Image Segmentation-
[pdf]
[bibtex]@InProceedings{Tran_2026_WACV, author = {Tran, Sy Dat and Gahm, Jin Kyu}, title = {Hymavi : A Hybrid Mamba-Attention Network in Multi-View Framework for Volumetric Medical Image Segmentation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6006-6015} }
DocWaveDiff: A Predict-and-Refine approach for Document Image Enhancement with Wavelet U-Nets and Diffusion models-
[pdf]
[supp]
[bibtex]@InProceedings{Marulli_2026_WACV, author = {Marulli, Matteo and Bertini, Marco}, title = {DocWaveDiff: A Predict-and-Refine approach for Document Image Enhancement with Wavelet U-Nets and Diffusion models}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {8511-8520} }
ODEt(ODEl): Shortcutting the Time and the Length in Diffusion and Flow Models for Faster Sampling-
[pdf]
[supp]
[bibtex]@InProceedings{Gudovskiy_2026_WACV, author = {Gudovskiy, Denis and Zheng, Wenzhao and Okuno, Tomoyuki and Nakata, Yohei and Keutzer, Kurt}, title = {ODEt(ODEl): Shortcutting the Time and the Length in Diffusion and Flow Models for Faster Sampling}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6111-6120} }
Can Image Splicing and Copy-Move Forgery Be Detected by the Same Model? Forensim: An Attention-Based State-Space Approach-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Nandi_2026_WACV, author = {Nandi, Soumyaroop and Natarajan, Prem}, title = {Can Image Splicing and Copy-Move Forgery Be Detected by the Same Model? Forensim: An Attention-Based State-Space Approach}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6194-6204} }
TopoRec: Point Cloud Recognition Using Topological Data Analysis-
[pdf]
[arXiv]
[bibtex]@InProceedings{Ghosh_2026_WACV, author = {Ghosh, Anirban and Kulbaka, Iliya and Dahlin, Ian and Dutta, Ayan}, title = {TopoRec: Point Cloud Recognition Using Topological Data Analysis}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7544-7553} }
SFMNet: Sparse Focal Modulation for 3D Object Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Shrout_2026_WACV, author = {Shrout, Oren and Tal, Ayellet}, title = {SFMNet: Sparse Focal Modulation for 3D Object Detection}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6287-6297} }
Multi-Grained Text-Guided Image Fusion for Multi-Exposure and Multi-Focus Scenarios-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Tang_2026_WACV, author = {Tang, Mingwei and Nie, Jiahao and Yang, Guang and Cui, Ziqing and Li, Jie}, title = {Multi-Grained Text-Guided Image Fusion for Multi-Exposure and Multi-Focus Scenarios}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7668-7678} }
F-INR: Functional Tensor Decomposition for Implicit Neural Representations-
[pdf]
[supp]
[bibtex]@InProceedings{Vemuri_2026_WACV, author = {Vemuri, Sai Karthikeya and B\"uchner, Tim and Denzler, Joachim}, title = {F-INR: Functional Tensor Decomposition for Implicit Neural Representations}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6557-6568} }
Understanding the Visual Projection Space of Multimodal LLMs-
[pdf]
[bibtex]@InProceedings{Jeong_2026_WACV, author = {Jeong, Sungheon and Song, Yoojeong and Kim, Hyungjoon}, title = {Understanding the Visual Projection Space of Multimodal LLMs}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6049-6058} }
Flood-LDM: Generalizable Latent Diffusion Models for rapid and accurate zero-shot High-Resolution Flood Mapping-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Neo_2026_WACV, author = {Neo, Sun Han and Seneviratne, Sachith and Herath, Herath Mudiyanselage Viraj Vidura Herath and Saha, Abhishek and Rasnayaka, Sanka and Marshall, Lucy Amanda}, title = {Flood-LDM: Generalizable Latent Diffusion Models for rapid and accurate zero-shot High-Resolution Flood Mapping}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {8063-8072} }
PerVL-Bench: Benchmarking Multimodal Personalization for Large Vision-Language Models-
[pdf]
[supp]
[bibtex]@InProceedings{Kim_2026_WACV, author = {Kim, Minsung}, title = {PerVL-Bench: Benchmarking Multimodal Personalization for Large Vision-Language Models}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6696-6704} }
OSEG: Improving Diffusion sampling through Orthogonal Smoothed Energy Guidance-
[pdf]
[supp]
[bibtex]@InProceedings{Fahim_2026_WACV, author = {Fahim, Masud An Nur Islam and Saqib, Nazmus and Gil, Joon-Min}, title = {OSEG: Improving Diffusion sampling through Orthogonal Smoothed Energy Guidance}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {5996-6005} }
Motion-Aware Graph Fusion Network for 3D Human Pose Estimation-
[pdf]
[supp]
[bibtex]@InProceedings{Pham_2026_WACV, author = {Pham, Yen and Yuan, Xiaohui and Zhuang, Chengyuan}, title = {Motion-Aware Graph Fusion Network for 3D Human Pose Estimation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {5798-5808} }
Graph Query Networks for Object Detection with Automotive Radar-
[pdf]
[arXiv]
[bibtex]@InProceedings{Saini_2026_WACV, author = {Saini, Loveneet and Tercan, Hasan and Meisen, Tobias}, title = {Graph Query Networks for Object Detection with Automotive Radar}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6988-6997} }
GroupPortrait: Multi-ID Portrait Generation with High Identity Preservation and Fine-Grained Control-
[pdf]
[supp]
[bibtex]@InProceedings{Huang_2026_WACV, author = {Huang, Meijia and Li, Ruida and Ma, Bing and Jiang, Liangwei and Fang, Shuo and Ma, Chenguang}, title = {GroupPortrait: Multi-ID Portrait Generation with High Identity Preservation and Fine-Grained Control}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6226-6235} }
FAIR-SIGHT: Fairness Assurance in Image Recognition via Simultaneous Conformal Thresholding and Dynamic Output Repair-
[pdf]
[arXiv]
[bibtex]@InProceedings{Fayyazi_2026_WACV, author = {Fayyazi, Arya and Kamal, Mehdi and Pedram, Massoud}, title = {FAIR-SIGHT: Fairness Assurance in Image Recognition via Simultaneous Conformal Thresholding and Dynamic Output Repair}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6633-6642} }
T2LF: LLM-Guided Multimodal Diffusion for Text-to-Light Field Synthesis-
[pdf]
[supp]
[bibtex]@InProceedings{Yoon_2026_WACV, author = {Yoon, Soyoung and Ahn, Namhyuk and Park, In Kyu}, title = {T2LF: LLM-Guided Multimodal Diffusion for Text-to-Light Field Synthesis}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7322-7332} }
Training-free Conditional Image Embedding Framework Leveraging Large Vision Language Models-
[pdf]
[supp]
[bibtex]@InProceedings{Kawarada_2026_WACV, author = {Kawarada, Masayuki and Yamada, Kosuke and Tejero-de-Pablos, Antonio and Inoue, Naoto}, title = {Training-free Conditional Image Embedding Framework Leveraging Large Vision Language Models}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7636-7646} }
General and Domain-Specific Zero-shot Detection of Generated Images via Conditional Likelihood-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Betser_2026_WACV, author = {Betser, Roy and Hofman, Omer and Vainshtein, Roman and Gilboa, Guy}, title = {General and Domain-Specific Zero-shot Detection of Generated Images via Conditional Likelihood}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7809-7820} }
MM-TS: Multi-Modal Temperature and Margin Schedules for Contrastive Learning with Long-Tail Data-
[pdf]
[supp]
[bibtex]@InProceedings{Sheludzko_2026_WACV, author = {Sheludzko, Siarhei and Duka, Dhimitrios and Schiele, Bernt and Kuehne, Hilde and Kukleva, Anna}, title = {MM-TS: Multi-Modal Temperature and Margin Schedules for Contrastive Learning with Long-Tail Data}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7376-7386} }
VitaGlyph: Vitalizing Artistic Typography with Flexible Dual-branch Diffusion Models-
[pdf]
[arXiv]
[bibtex]@InProceedings{Feng_2026_WACV, author = {Feng, Kailai and Zhang, Yabo and Yu, Haodong and Ji, Zhilong and Bai, Jinfeng and Zhang, Hongzhi and Zuo, Wangmeng}, title = {VitaGlyph: Vitalizing Artistic Typography with Flexible Dual-branch Diffusion Models}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {8220-8230} }
GHOST: Getting to the Bottom of Hallucinations with A Multi-round Consistency Benchmark-
[pdf]
[supp]
[bibtex]@InProceedings{VS_2026_WACV, author = {VS, Vibashan and Chang, Nadine and Schmalfuss, Jenny and Patel, Vishal M. and Yu, Zhiding and Alvarez, Jose M.}, title = {GHOST: Getting to the Bottom of Hallucinations with A Multi-round Consistency Benchmark}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6163-6173} }
Optimizing against Infeasible Inclusions from Data for Semantic Segmentation through Morphology-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Basu_2026_WACV, author = {Basu, Shamik and Van Gool, Luc and Sakaridis, Christos}, title = {Optimizing against Infeasible Inclusions from Data for Semantic Segmentation through Morphology}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7524-7533} }
Zero-Shot Audio-Visual Editing via Cross-Modal Delta Denoising-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lin_2026_WACV, author = {Lin, Yan-Bo and Lin, Kevin and Yang, Zhengyuan and Li, Linjie and Wang, Jianfeng and Lin, Chung-Ching and Wang, Xiaofei and Bertasius, Gedas and Wang, Lijuan}, title = {Zero-Shot Audio-Visual Editing via Cross-Modal Delta Denoising}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7344-7354} }
D2Mamba: Dual Domain Guided Informed Search in State Space Model for Underwater Image Enhancement-
[pdf]
[supp]
[bibtex]@InProceedings{Pramanick_2026_WACV, author = {Pramanick, Alik and Roy, Soumajit and Sur, Arijit}, title = {D2Mamba: Dual Domain Guided Informed Search in State Space Model for Underwater Image Enhancement}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7126-7136} }
TM-Adapter: Temporal Merge Adapter for Efficient Global Temporal Modeling-
[pdf]
[supp]
[bibtex]@InProceedings{Hahm_2026_WACV, author = {Hahm, Woo Joo and Jang, Seungwoo and Kim, Hyeon Tak and Lee, Daeun and Kim, Kwangsu}, title = {TM-Adapter: Temporal Merge Adapter for Efficient Global Temporal Modeling}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6121-6131} }
Guiding What Not to Generate: Automated Negative Prompting for Text-Image Alignment-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Park_2026_WACV, author = {Park, Sangha and Kim, Eunji and Oh, Yeongtak and Choi, Jooyoung and Yoon, Sungroh}, title = {Guiding What Not to Generate: Automated Negative Prompting for Text-Image Alignment}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6664-6675} }
LASER: Lip Landmark Assisted Speaker Detection for Robustness-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Nguyen_2026_WACV, author = {Nguyen, Le Thien Phuc and Yu, Zhuoran and Lee, Yong Jae}, title = {LASER: Lip Landmark Assisted Speaker Detection for Robustness}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7291-7300} }
SpecGen: Neural Spectral BRDF Generation via Spectral-Spatial Tri-plane Aggregation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Jin_2026_WACV, author = {Jin, Zhenyu and Li, Wenjie and Ma, Zhanyu and Guo, Heng}, title = {SpecGen: Neural Spectral BRDF Generation via Spectral-Spatial Tri-plane Aggregation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {8323-8332} }
A Unified Diffusion-Based Framework for Multi-Agent Trajectory Prediction Integrating Structured Multi-Modal Representations-
[pdf]
[bibtex]@InProceedings{Yang_2026_WACV, author = {Yang, Chenxi and Xi, Suyang and Ding, Hong and Shen, Yiqing and Liu, Yunhao}, title = {A Unified Diffusion-Based Framework for Multi-Agent Trajectory Prediction Integrating Structured Multi-Modal Representations}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6442-6452} }
IMPACT: Interpretable Most Important Person Analysis and Classification using Transformer-based Models-
[pdf]
[supp]
[bibtex]@InProceedings{Rampuria_2026_WACV, author = {Rampuria, Akshat and Nayak, Kamakshya Prasad and Thakare, Kamalakar Vijay and Joshi, Tushar and Singh, Aditya Dhananjay and Park, Haesol and Choi, Heeseung and Dogra, Debi Prosad and Kim, Ig-Jae}, title = {IMPACT: Interpretable Most Important Person Analysis and Classification using Transformer-based Models}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {8179-8187} }
HOLO: Holistic Lightweight Optimization for Scene Understanding with Auto-Annotation and Multimodal Learning-
[pdf]
[supp]
[bibtex]@InProceedings{Hu_2026_WACV, author = {Hu, Xiaoyun and Yan, Xiaohan and Wang, Nan and Wei, Gang and Wang, Zhicheng}, title = {HOLO: Holistic Lightweight Optimization for Scene Understanding with Auto-Annotation and Multimodal Learning}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7719-7729} }
UniVid: Unifying Vision Tasks with Pre-trained Video Generation Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chen_2026_WACV, author = {Chen, Lan and Gu, Yuchao and Mao, Qi}, title = {UniVid: Unifying Vision Tasks with Pre-trained Video Generation Models}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6754-6763} }
MedPEFT-CL: Dual-Phase Parameter-Efficient Continual Learning with Medical Semantic Adapter and Bidirectional Memory Consolidation-
[pdf]
[bibtex]@InProceedings{Gao_2026_WACV, author = {Gao, Ziyuan and Morel, Philippe}, title = {MedPEFT-CL: Dual-Phase Parameter-Efficient Continual Learning with Medical Semantic Adapter and Bidirectional Memory Consolidation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7699-7708} }
ZebraPose: Zebra Detection and Pose Estimation using only Synthetic Data-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Bonetto_2026_WACV, author = {Bonetto, Elia and Ahmad, Aamir}, title = {ZebraPose: Zebra Detection and Pose Estimation using only Synthetic Data}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6611-6620} }
DM3Net: Dual-Camera Super-Resolution via Domain Modulation and Multi-scale Matching-
[pdf]
[supp]
[bibtex]@InProceedings{Guan_2026_WACV, author = {Guan, Cong and Ying, Jiacheng and Ieiri, Yuya and Yoshie, Osamu}, title = {DM3Net: Dual-Camera Super-Resolution via Domain Modulation and Multi-scale Matching}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7472-7481} }
Distilling What and Why: Enhancing Driver Intention Prediction with MLLMs-
[pdf]
[supp]
[bibtex]@InProceedings{Artham_2026_WACV, author = {Artham, Sainithin and Dasgupta, Avijit and Gangisetty, Shankar and Jawahar, C. V.}, title = {Distilling What and Why: Enhancing Driver Intention Prediction with MLLMs}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7281-7290} }
Diffusion-Based Action Recognition Generalizes to Untrained Domains-
[pdf]
[supp]
[bibtex]@InProceedings{Guimaraes_2026_WACV, author = {Guimar{\~a}es, Rog{\'e}rio and Xiao, Frank and Perona, Pietro and Marks, Markus}, title = {Diffusion-Based Action Recognition Generalizes to Untrained Domains}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {5919-5933} }
EVTP-IVS: Effective Visual Token Pruning For Unifying Instruction Visual Segmentation In Multi-Modal Large Language Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhu_2026_WACV, author = {Zhu, Wenhui and Chen, Xiwen and Wang, Zhipeng and Tang, Shao and Ghosh, Sayan and Dong, Xuanzhao and Koner, Rajat and Wang, Yalin}, title = {EVTP-IVS: Effective Visual Token Pruning For Unifying Instruction Visual Segmentation In Multi-Modal Large Language Models}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7158-7167} }
ReFineVQA: Iterative Refinement of Video Description via Feedback Generation for Video Question Answering-
[pdf]
[supp]
[bibtex]@InProceedings{Shin_2026_WACV, author = {Shin, Jeongwan and Hur, Chan and Cho, Seongmin and Choi, Jaeho and Park, Hyeyoung}, title = {ReFineVQA: Iterative Refinement of Video Description via Feedback Generation for Video Question Answering}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7647-7657} }
DUDA: Distilled Unsupervised Domain Adaptation for Lightweight Semantic Segmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kang_2026_WACV, author = {Kang, Beomseok and Mithun, Niluthpol Chowdhury and Rajvanshi, Abhinav and Chiu, Han-Pang and Samarasekera, Supun}, title = {DUDA: Distilled Unsupervised Domain Adaptation for Lightweight Semantic Segmentation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {8124-8135} }
OPFormer: Object Pose Estimation Leveraging Foundation Model with Geometric Encoding-
[pdf]
[supp]
[bibtex]@InProceedings{Moroz_2026_WACV, author = {Moroz, Artem and Zeman, V{\'\i}t and Mik{\v{s}}{\'\i}k, Martin and Isianova, Elizaveta and David, Miroslav and Burget, Pavel and Burde, Varun}, title = {OPFormer: Object Pose Estimation Leveraging Foundation Model with Geometric Encoding}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6621-6632} }
Enhancing Reverse Distillation with Core Exemplar Learning for Unified Multi-Class Anomaly Detection-
[pdf]
[bibtex]@InProceedings{Lim_2026_WACV, author = {Lim, Heechul and Kim, Min-Soo and Lee, Hyun-Boo and Kang, Suk-Ju and Chon, Kang-Wook and Lee, Haeyun}, title = {Enhancing Reverse Distillation with Core Exemplar Learning for Unified Multi-Class Anomaly Detection}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7586-7595} }
Joint Optimization of Camera Model and Deep Neural Network for Image Recognition-
[pdf]
[supp]
[bibtex]@InProceedings{Noboru_2026_WACV, author = {Noboru, Youta and Ozasa, Yuko and Tanaka, Masayuki}, title = {Joint Optimization of Camera Model and Deep Neural Network for Image Recognition}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7626-7635} }
DirectDrag: High-Fidelity, Mask-Free, Prompt-Free Drag-based Image Editing via Readout-Guided Feature Alignment-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liao_2026_WACV, author = {Liao, Sheng-Hao and Chen, Shang-Fu and Huang, Tai-Ming and Cheng, Wen-Huang and Hua, Kai-Lung}, title = {DirectDrag: High-Fidelity, Mask-Free, Prompt-Free Drag-based Image Editing via Readout-Guided Feature Alignment}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {8252-8261} }
Single-step Diffusion for Image Compression at Ultra-Low Bitrates-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Park_2026_WACV, author = {Park, Chanung and Lee, Joo Chan and Ko, Jong Hwan}, title = {Single-step Diffusion for Image Compression at Ultra-Low Bitrates}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6391-6400} }
TED-4DGS: Temporally Activated and Embedding-based Deformation for 4DGS Compression-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ho_2026_WACV, author = {Ho, Cheng-Yuan and Yang, He-Bi and Chiang, Jui-Chiu and Liu, Yu-Lun and Peng, Wen-Hsiao}, title = {TED-4DGS: Temporally Activated and Embedding-based Deformation for 4DGS Compression}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6371-6380} }
View-aware Cross-modal Distillation for Multi-view Action Recognition-
[pdf]
[arXiv]
[bibtex]@InProceedings{Nguyen_2026_WACV, author = {Nguyen, Trung Thanh and Kawanishi, Yasutomo and John, Vijay and Komamizu, Takahiro and Ide, Ichiro}, title = {View-aware Cross-modal Distillation for Multi-view Action Recognition}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7769-7778} }
FedEFC: Federated Learning Using Enhanced Forward Correction Against Noisy Labels-
[pdf]
[arXiv]
[bibtex]@InProceedings{Yu_2026_WACV, author = {Yu, Seunghun and Ahn, Jin-Hyun and Kang, Joonhyuk}, title = {FedEFC: Federated Learning Using Enhanced Forward Correction Against Noisy Labels}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {8094-8102} }
LogicCBMs: Logic-Enhanced Concept-Based Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Vemuri_2026_WACV, author = {Vemuri, Deepika SN and Bellamkonda, Gautham and Pola, Aditya and Balasubramanian, Vineeth N}, title = {LogicCBMs: Logic-Enhanced Concept-Based Learning}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6039-6048} }
FNOPT: Resolution-Agnostic, Self-Supervised Cloth Simulation using Meta-Optimization with Fourier Neural Operators-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chen_2026_WACV, author = {Chen, Ruochen and Tran, Thuy and Parashar, Shaifali}, title = {FNOPT: Resolution-Agnostic, Self-Supervised Cloth Simulation using Meta-Optimization with Fourier Neural Operators}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7116-7125} }
Diversity Preserving Coresets for Image Quality Assessment-
[pdf]
[supp]
[bibtex]@InProceedings{Nema_2026_WACV, author = {Nema, Arpita and Zhu, Hanwei and Zhang, Xi and Lin, Weisi}, title = {Diversity Preserving Coresets for Image Quality Assessment}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7925-7934} }
RoadBench: A Vision-Language Foundation Model and Benchmark for Road Damage Understanding-
[pdf]
[arXiv]
[bibtex]@InProceedings{Xiao_2026_WACV, author = {Xiao, Xi and Zhang, Yunbei and Wang, Janet and Zhao, Lin and Wei, Yuxiang and Li, Hengjia and Li, Yanshu and Wang, Xiao and Roy, Swalpa Kumar and Xu, Hao and Wang, Tianyang}, title = {RoadBench: A Vision-Language Foundation Model and Benchmark for Road Damage Understanding}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6016-6026} }
Optimization-Free Style Transfer for 3D Gaussian Splats-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Du_Sablon_2026_WACV, author = {Du Sablon, Raphael and Hart, David}, title = {Optimization-Free Style Transfer for 3D Gaussian Splats}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {8041-8051} }
From Cognitive Priors to Instance Semantics: A Unified Framework for Multi-task Affective Computing-
[pdf]
[bibtex]@InProceedings{Hu_2026_WACV, author = {Hu, Guanyu and Kollias, Dimitrios and Yang, Xinyu}, title = {From Cognitive Priors to Instance Semantics: A Unified Framework for Multi-task Affective Computing}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {8551-8562} }
PoseAdapt: Sustainable Human Pose Estimation via Continual Learning Benchmarks and Toolkit-
[pdf]
[arXiv]
[bibtex]@InProceedings{Khan_2026_WACV, author = {Khan, Muhammad Saif Ullah and Stricker, Didier}, title = {PoseAdapt: Sustainable Human Pose Estimation via Continual Learning Benchmarks and Toolkit}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6840-6850} }
Cycle-Consistent Multi-Graph Matching for Self-Supervised Annotation of C. Elegans-
[pdf]
[supp]
[bibtex]@InProceedings{Stricker_2026_WACV, author = {Stricker, Sebastian and Karg, Christoph and Hutschenreiter, Lisa and Savchynskyy, Bogdan and Kainmueller, Dagmar}, title = {Cycle-Consistent Multi-Graph Matching for Self-Supervised Annotation of C. Elegans}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7208-7217} }
Locally Explaining Prediction Behavior via Gradual Interventions and Measuring Property Gradients-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Penzel_2026_WACV, author = {Penzel, Niklas and Denzler, Joachim}, title = {Locally Explaining Prediction Behavior via Gradual Interventions and Measuring Property Gradients}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7398-7408} }
Scalable Video Action Anticipation with Cross Linear Attentive Memory-
[pdf]
[supp]
[bibtex]@InProceedings{Zhong_2026_WACV, author = {Zhong, Zeyun and Martin, Manuel and Schneider, David and Lerch, David J. and Wu, Chengzhi and Diederichs, Frederik and Gall, Juergen and Beyerer, J{\"u}rgen}, title = {Scalable Video Action Anticipation with Cross Linear Attentive Memory}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {8113-8123} }
FairVLM: Enhancing Fairness and Prompt Sensitivity in Vision Language Models for Medical Image Segmentation-
[pdf]
[supp]
[bibtex]@InProceedings{Rahman_2026_WACV, author = {Rahman, Md Motiur and Rahman, Saeka and Bhatt, Smriti and Faezipour, Miad}, title = {FairVLM: Enhancing Fairness and Prompt Sensitivity in Vision Language Models for Medical Image Segmentation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7450-7460} }
NRGMark: Localized Watermarking for Energy Transparency in Images-
[pdf]
[bibtex]@InProceedings{Agarwal_2026_WACV, author = {Agarwal, Shruti and Michel, {\'E}lie and Asnani, Vishal and Mathern, Tania and Collomosse, John}, title = {NRGMark: Localized Watermarking for Energy Transparency in Images}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7779-7788} }
V2XScene: Multi-View Consistent 3D Scene Simulation for Collaborative Perception-
[pdf]
[bibtex]@InProceedings{Li_2026_WACV, author = {Li, Yanfei and Gong, Yi and Zeng, Yuan}, title = {V2XScene: Multi-View Consistent 3D Scene Simulation for Collaborative Perception}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6569-6579} }
Advancing Multimodal LLMs by Large-Scale 3D Visual Instruction Dataset Generation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{He_2026_WACV, author = {He, Liu and Zeng, Xiao and Song, Yizhi and Chen, Albert Y. C. and Xia, Lu and Verma, Shashwat and Dayal, Sankalp and Sun, Min and Kuo, Cheng-Hao and Aliaga, Daniel}, title = {Advancing Multimodal LLMs by Large-Scale 3D Visual Instruction Dataset Generation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {5886-5897} }
Test-Time Adaptation for Video Highlight Detection Using Meta-Auxiliary Learning and Cross-Modality Hallucinations-
[pdf]
[arXiv]
[bibtex]@InProceedings{Islam_2026_WACV, author = {Islam, Zahidul and Paul, Sujoy and Rochan, Mrigank}, title = {Test-Time Adaptation for Video Highlight Detection Using Meta-Auxiliary Learning and Cross-Modality Hallucinations}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6893-6902} }
Stabilizing Direct Training of Spiking Neural Networks: Membrane Potential Initialization and Threshold-robust Surrogate Gradient-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kook_2026_WACV, author = {Kook, Hyunho and Yu, Byeongho and Oh, Jeong Min and Park, Eunhyeok}, title = {Stabilizing Direct Training of Spiking Neural Networks: Membrane Potential Initialization and Threshold-robust Surrogate Gradient}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {8500-8510} }
SphereEdit: Spherical Semantic Editing in Diffusion Models-
[pdf]
[supp]
[bibtex]@InProceedings{Konate_2026_WACV, author = {Konate, Salamata and Hamidi, Hassan and Dolatabadi, Elham and Rudzicz, Frank and Seyyed-Kalantari, Laleh}, title = {SphereEdit: Spherical Semantic Editing in Diffusion Models}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {8084-8093} }
S2O: Static to Openable Enhancement for Articulated 3D Objects-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Iliash_2026_WACV, author = {Iliash, Denys and Jiang, Hanxiao and Zhang, Yiming and Savva, Manolis and Chang, Angel X.}, title = {S2O: Static to Openable Enhancement for Articulated 3D Objects}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6785-6795} }
UniGaze: Towards Universal Gaze Estimation via Large-scale Pre-Training-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Qin_2026_WACV, author = {Qin, Jiawei and Zhang, Xucong and Sugano, Yusuke}, title = {UniGaze: Towards Universal Gaze Estimation via Large-scale Pre-Training}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {5809-5820} }
Splatter Layout: Geometry-embedded 3D Reconstruction via Surface Unfolding-
[pdf]
[supp]
[bibtex]@InProceedings{Heryanto_2026_WACV, author = {Heryanto, Bryan and You, Tackgeun and Kim, Chanwoo and Lim, Hwasup}, title = {Splatter Layout: Geometry-embedded 3D Reconstruction via Surface Unfolding}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7709-7718} }
Optimal Transport for Rectified Flow Image Editing: Unifying Inversion-Based and Direct Methods-
[pdf]
[supp]
[bibtex]@InProceedings{Lupascu_2026_WACV, author = {Lupa{\c{s}}cu, Marian and Stupariu, Mihai Sorin}, title = {Optimal Transport for Rectified Flow Image Editing: Unifying Inversion-Based and Direct Methods}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6764-6774} }
ICONIC-444: A 3.1-Million-Image Dataset for OOD Detection Research-
[pdf]
[supp]
[bibtex]@InProceedings{Krumpl_2026_WACV, author = {Krumpl, Gerhard and Avenhaus, Henning and Possegger, Horst}, title = {ICONIC-444: A 3.1-Million-Image Dataset for OOD Detection Research}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {8427-8436} }
FuLLaMa: Training-free Diffusion-based Object Removal with Context Preservation-
[pdf]
[supp]
[bibtex]@InProceedings{Demir_2026_WACV, author = {Demir, Ilke and Ciftci, Umur Aybars}, title = {FuLLaMa: Training-free Diffusion-based Object Removal with Context Preservation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {8563-8573} }
Where is the Watermark? Interpretable Watermark Detection at the Block Level-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Bulychev_2026_WACV, author = {Bulychev, Maria and Marchant, Neil G. and Rubinstein, Benjamin I. P.}, title = {Where is the Watermark? Interpretable Watermark Detection at the Block Level}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7420-7429} }
HABIT: Human Action Benchmark for Interactive Traffic in CARLA-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ramesh_2026_WACV, author = {Ramesh, Mohan and Azer, Mark and Flohr, Fabian}, title = {HABIT: Human Action Benchmark for Interactive Traffic in CARLA}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7148-7157} }
Patch Your Matcher: Correspondence-Aware Image-to-Image Translation Unlocks Cross-Modal Matching via Single-Modality Priors-
[pdf]
[supp]
[bibtex]@InProceedings{Frolov_2026_WACV, author = {Frolov, Anton and Rodehorst, Volker}, title = {Patch Your Matcher: Correspondence-Aware Image-to-Image Translation Unlocks Cross-Modal Matching via Single-Modality Priors}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7913-7924} }
A Deep Network for Object Detection on Inland Waters-
[pdf]
[supp]
[bibtex]@InProceedings{Griesser_2026_WACV, author = {Griesser, Dennis and Goldluecke, Bastian and Franz, Matthias O. and Umlauf, Georg}, title = {A Deep Network for Object Detection on Inland Waters}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6590-6599} }
Logit-Adjusted Test-Time Adaptation under Partial Class Imbalance-
[pdf]
[supp]
[bibtex]@InProceedings{Weerasinghe_2026_WACV, author = {Weerasinghe, Thilina and Tennakoon, Ruwan and Chuah, WeiQin and Bab-Hadiashar, Alireza}, title = {Logit-Adjusted Test-Time Adaptation under Partial Class Imbalance}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {5977-5985} }
AuthGuard: Generalizable Deepfake Detection via Language Guidance-
[pdf]
[arXiv]
[bibtex]@InProceedings{Shen_2026_WACV, author = {Shen, Guangyu and Li, Zhihua and Xu, Xiang and Zhao, Tianchen and Zhang, Zheng and An, Dongsheng and Tu, Zhuowen and Xing, Yifan and Zhang, Qin}, title = {AuthGuard: Generalizable Deepfake Detection via Language Guidance}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6215-6225} }
VIZOR: Viewpoint-Invariant Zero-Shot Scene Graph Generation for 3D Scene Reasoning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Madhavaram_2026_WACV, author = {Madhavaram, Vivek and Sengar, Vartika and De, Arkadipta and Sharma, Charu}, title = {VIZOR: Viewpoint-Invariant Zero-Shot Scene Graph Generation for 3D Scene Reasoning}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {8584-8595} }
Gaussian Splatting Map Registration with Orthographic Bird's-Eye-View Renderings-
[pdf]
[supp]
[bibtex]@InProceedings{Leblond_2026_WACV, author = {Leblond, H. and Simon, G. and Martins, R. and Demonceaux, C. and Berger, M.-O.}, title = {Gaussian Splatting Map Registration with Orthographic Bird's-Eye-View Renderings}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6080-6089} }
IPCD: Intrinsic Point-Cloud Decomposition-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Sato_2026_WACV, author = {Sato, Shogo and Kaneko, Takuhiro and Takeda, Shoichiro and Shimada, Tomoyasu and Murasaki, Kazuhiko and Yoshida, Taiga and Tanida, Ryuichi and Kimura, Akisato}, title = {IPCD: Intrinsic Point-Cloud Decomposition}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7094-7103} }
Diffusion Noise Optimization for Synthetic VLM Training-
[pdf]
[supp]
[bibtex]@InProceedings{Ohkubo_2026_WACV, author = {Ohkubo, Ren and Yanagi, Rintaro and Kataoka, Hirokatsu and Satoh, Yutaka}, title = {Diffusion Noise Optimization for Synthetic VLM Training}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6412-6421} }
TacticalCalib: End-to-End 6-DoF Camera Pose Regression for Tactical Camera Calibration-
[pdf]
[bibtex]@InProceedings{Fan_2026_WACV, author = {Fan, Liang and Liu, Xiaoqian and Chen, Zhi and Yang, Lingkai}, title = {TacticalCalib: End-to-End 6-DoF Camera Pose Regression for Tactical Camera Calibration}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6547-6556} }
FlowCLAS: Enhancing Normalizing Flow-Based Anomaly Segmentation Via Contrastive Learning-
[pdf]
[supp]
[bibtex]@InProceedings{Lee_2026_WACV, author = {Lee, Chang Won and Leveugle, Selina and Grouchy, Paul and Langley, Chris and Stolpner, Svetlana and Kelly, Jonathan and Waslander, Steven L.}, title = {FlowCLAS: Enhancing Normalizing Flow-Based Anomaly Segmentation Via Contrastive Learning}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6998-7007} }
SuperRivolution: Fine-Scale Rivers from Coarse Temporal Satellite Imagery-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Daroya_2026_WACV, author = {Daroya, Rangel and Maji, Subhransu}, title = {SuperRivolution: Fine-Scale Rivers from Coarse Temporal Satellite Imagery}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7482-7492} }
R-MMA: Enhancing Vision-Language Models with Recurrent Adapters for Few-Shot and Cross-Domain Generalization-
[pdf]
[supp]
[bibtex]@InProceedings{Fahim_2026_WACV, author = {Fahim, Md and Ishmam, Md Farhan and Hossain, Mir Sazzat and Amin, M Ashraful and Ali, Amin Ahsan and Rahman, AKM Mahbubur}, title = {R-MMA: Enhancing Vision-Language Models with Recurrent Adapters for Few-Shot and Cross-Domain Generalization}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6496-6506} }
TRACE: Confounder-free Adversarial Fine-tuning for Robust Object Detection-
[pdf]
[supp]
[bibtex]@InProceedings{Lee_2026_WACV, author = {Lee, Wonho and Lee, Jisu and Na, Hyunsik and Park, Sohee and Choi, Daeseon}, title = {TRACE: Confounder-free Adversarial Fine-tuning for Robust Object Detection}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6705-6714} }
SOLAR: Switchable Output Layer for Accuracy and Robustness in Once-for-All Training-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Tareen_2026_WACV, author = {Tareen, Shaharyar Ahmed Khan and Fan, Lei and Yuan, Xiaojing and Lin, Qin and Hu, Bin}, title = {SOLAR: Switchable Output Layer for Accuracy and Robustness in Once-for-All Training}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7893-7902} }
DexAvatar: 3D Sign Language Reconstruction with Hand and Body Pose Priors-
[pdf]
[supp]
[bibtex]@InProceedings{Kundu_2026_WACV, author = {Kundu, Kaustubh and Barua, Hrishav Bakul and Robertson-Bell, Lucy and Cai, Zhixi and Stefanov, Kalin}, title = {DexAvatar: 3D Sign Language Reconstruction with Hand and Body Pose Priors}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {5842-5852} }
SegMo: Segment-aligned Text to 3D Human Motion Generation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Dang_2026_WACV, author = {Dang, Bowen and Wu, Lin and Yang, Xiaohang and Yuan, Zheng and Chen, Zhixiang}, title = {SegMo: Segment-aligned Text to 3D Human Motion Generation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6946-6955} }
SceneProp: Combining Neural Network and Markov Random Field for Scene-Graph Grounding-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Otani_2026_WACV, author = {Otani, Keita and Harada, Tatsuya}, title = {SceneProp: Combining Neural Network and Markov Random Field for Scene-Graph Grounding}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6153-6162} }
WiSAR3D - Aerial LiDAR Dataset for 3D Object Detection-
[pdf]
[supp]
[bibtex]@InProceedings{Shrout_2026_WACV, author = {Shrout, Oren and Nizan, Ori and Ben-Shabat, Yizhak and Tal, Ayellet}, title = {WiSAR3D - Aerial LiDAR Dataset for 3D Object Detection}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6580-6589} }
Exploiting Label-Independent Regularization from Spatial Patterns for Whole Slide Image Analysis-
[pdf]
[supp]
[bibtex]@InProceedings{Wu_2026_WACV, author = {Wu, Weiyi and Xu, Xinwen and Gao, Chongyang and Diao, Xingjian and Li, Siting and Gui, Jiang}, title = {Exploiting Label-Independent Regularization from Spatial Patterns for Whole Slide Image Analysis}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {8639-8649} }
Co-STAR: Collaborative Curriculum Self-Training with Adaptive Regularization for Source-Free Video Domain Adaptation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Dadashzadeh_2026_WACV, author = {Dadashzadeh, Amirhossein and Esmati, Parsa and Mirmehdi, Majid}, title = {Co-STAR: Collaborative Curriculum Self-Training with Adaptive Regularization for Source-Free Video Domain Adaptation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7821-7831} }
QuEENet: Quantum-Enhanced Expressive Network for Image Classification-
[pdf]
[supp]
[bibtex]@InProceedings{Bayal_2026_WACV, author = {Bayal, Shashank and Dawane, Rushikesh Govind and Komal, Komal and Vipparthi, Santosh Kumar and Murala, Subrahmanyam}, title = {QuEENet: Quantum-Enhanced Expressive Network for Image Classification}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7883-7892} }
SHaSaM: Submodular Hard Sample Mining for Fair Facial Attribute Recognition-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Majee_2026_WACV, author = {Majee, Anay and Iyer, Rishabh}, title = {SHaSaM: Submodular Hard Sample Mining for Fair Facial Attribute Recognition}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7461-7471} }
SGD-Mix: Enhancing Domain-Specific Image Classification with Label-Preserving Data Augmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Dong_2026_WACV, author = {Dong, Yixuan and Su, Fang-Yi and Chiang, Jung-Hsien}, title = {SGD-Mix: Enhancing Domain-Specific Image Classification with Label-Preserving Data Augmentation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7051-7061} }
Unsupervised Discovery of Long-Term Spatiotemporal Periodic Workflows in Human Activities-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yang_2026_WACV, author = {Yang, Fan and Xie, Quanting and Moteki, Atsunori and Masui, Shoichi and Jiang, Shan and Uchino, Kanji and Bisk, Yonatan and Neubig, Graham}, title = {Unsupervised Discovery of Long-Term Spatiotemporal Periodic Workflows in Human Activities}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {5821-5832} }
Revisiting an Old Perspective Projection for Monocular 3D Morphable Models Regression-
[pdf]
[bibtex]@InProceedings{Chong_2026_WACV, author = {Chong, Toby and Nakajima, Ryota}, title = {Revisiting an Old Perspective Projection for Monocular 3D Morphable Models Regression}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7799-7808} }
SafeguardGS: 3D Gaussian Primitive Pruning While Avoiding Catastrophic Scene Destruction-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lee_2026_WACV, author = {Lee, Yongjae and Zhang, Zhaoliang and Fan, Deliang}, title = {SafeguardGS: 3D Gaussian Primitive Pruning While Avoiding Catastrophic Scene Destruction}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {8479-8489} }
Deep Image Decomposition for Medical Imaging Anonymization and Curation-
[pdf]
[supp]
[bibtex]@InProceedings{Elkin_2026_WACV, author = {Elkin, Yael and Ben-Arie, Gal and Riklin-Raviv, Tammy}, title = {Deep Image Decomposition for Medical Imaging Anonymization and Curation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7229-7238} }
Clear Sights on Site: A Spatial-Adaptive Channel Network for Deblurring Construction Site Images-
[pdf]
[supp]
[bibtex]@InProceedings{Bonyani_2026_WACV, author = {Bonyani, Mahdi and Soleymani, Maryam and Wang, Chao}, title = {Clear Sights on Site: A Spatial-Adaptive Channel Network for Deblurring Construction Site Images}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6936-6945} }
GRAPE (Gaussian Rendering for Accelerated Pixel Enhancement) Brings Fast and Lightweight Arbitrary Super-Resolution-
[pdf]
[supp]
[bibtex]@InProceedings{Jang_2026_WACV, author = {Jang, Jung In and Jin, Kyong Hwan}, title = {GRAPE (Gaussian Rendering for Accelerated Pixel Enhancement) Brings Fast and Lightweight Arbitrary Super-Resolution}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7750-7758} }
HodgeFormer: Transformers for Learnable Operators on Triangular Meshes through Data-Driven Hodge Matrices-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Nousias_2026_WACV, author = {Nousias, Akis and Nousias, Stavros}, title = {HodgeFormer: Transformers for Learnable Operators on Triangular Meshes through Data-Driven Hodge Matrices}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6796-6805} }
Uplifting Table Tennis: A Robust, Real-World Application for 3D Trajectory and Spin Estimation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kienzle_2026_WACV, author = {Kienzle, Daniel and Ludwig, Katja and Lorenz, Julian and Satoh, Shin'Ichi and Lienhart, Rainer}, title = {Uplifting Table Tennis: A Robust, Real-World Application for 3D Trajectory and Spin Estimation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7440-7449} }
GeneVA: A Dataset of Human Annotations for Generative Text to Video Artifacts-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kang_2026_WACV, author = {Kang, Jenna and Silva, Maria Beatriz and Sangkloy, Patsorn and Chen, Kenneth and Williams, Niall L. and Sun, Qi}, title = {GeneVA: A Dataset of Human Annotations for Generative Text to Video Artifacts}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6174-6183} }
Synthesizing Compositional Videos from Text Description-
[pdf]
[supp]
[bibtex]@InProceedings{Singh_2026_WACV, author = {Singh, Prajwal and Kulkarni, Kuldeep and Raman, Shanmuganathan and Rangwani, Harsh}, title = {Synthesizing Compositional Videos from Text Description}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6775-6784} }
SSMT-Net: A Semi-Supervised Multitask Transformer-Based Network for Thyroid Nodule Segmentation in Ultrasound Images-
[pdf]
[bibtex]@InProceedings{Farooq_2026_WACV, author = {Farooq, Muhammad Umar and Rehman, Abd Ur and Rehman, Azka and Usman, Muhammad and Chae, Dong-Kyu}, title = {SSMT-Net: A Semi-Supervised Multitask Transformer-Based Network for Thyroid Nodule Segmentation in Ultrasound Images}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6069-6079} }
SAVE: Sparse Autoencoder-Driven Visual Information Enhancement for Mitigating Object Hallucination-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Park_2026_WACV, author = {Park, Sangha and Yoo, Seungryong and Mok, Jisoo and Yoon, Sungroh}, title = {SAVE: Sparse Autoencoder-Driven Visual Information Enhancement for Mitigating Object Hallucination}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7935-7944} }
Non-Aligned Reference Image Quality Assessment for Novel View Synthesis-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ghildyal_2026_WACV, author = {Ghildyal, Abhijay and Sureddi, Rajesh and Barman, Nabajeet and Zadtootaghaj, Saman and Bovik, Alan C}, title = {Non-Aligned Reference Image Quality Assessment for Novel View Synthesis}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6350-6359} }
BAFLE-DCT: Bypassing Adversarial Filters via Frequency-Selective Embedding in the DCT Domain-
[pdf]
[bibtex]@InProceedings{Mendis_2026_WACV, author = {Mendis, Thilina and Kandah, Farah and Aakur, Sathyanarayanan N.}, title = {BAFLE-DCT: Bypassing Adversarial Filters via Frequency-Selective Embedding in the DCT Domain}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {5967-5976} }
VLMDiff: Leveraging Vision-Language Models for Multi-Class Anomaly Detection with Diffusion-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Hicsonmez_2026_WACV, author = {Hicsonmez, Samet and El Rahman Shabayek, Abd and Aouada, Djamila}, title = {VLMDiff: Leveraging Vision-Language Models for Multi-Class Anomaly Detection with Diffusion}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6309-6319} }
MapVerse: A Benchmark for Geospatial Question Answering on Diverse Real-World Maps-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Bhat_2026_WACV, author = {Bhat, Sharat and Khandelwal, Harshita and Kataria, Tushar and Gupta, Vivek}, title = {MapVerse: A Benchmark for Geospatial Question Answering on Diverse Real-World Maps}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {8168-8178} }
Integrating Multi-scale and Multi-filtration Topological Features for Medical Image Classification-
[pdf]
[arXiv]
[bibtex]@InProceedings{Gu_2026_WACV, author = {Gu, Pengfei and Li, Huimin and Tang, Haoteng and Xu, Dongkuan and Enriquez, Erik and Kim, DongChul and Fu, Bin and Chen, Danny Z}, title = {Integrating Multi-scale and Multi-filtration Topological Features for Medical Image Classification}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {8660-8669} }
FlyPose: Towards Robust Human Pose Estimation From Aerial Views-
[pdf]
[bibtex]@InProceedings{Farooq_2026_WACV, author = {Farooq, Hassaan and Brenner, Marvin and St\"utz, Peter}, title = {FlyPose: Towards Robust Human Pose Estimation From Aerial Views}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {8617-8627} }
SAVeD: Learning to Denoise Low-SNR Video for Improved Downstream Performance-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Stathatos_2026_WACV, author = {Stathatos, Suzanne and Hobley, Michael and Perona, Pietro and Marks, Markus}, title = {SAVeD: Learning to Denoise Low-SNR Video for Improved Downstream Performance}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6851-6861} }
See, Record, Do: Automated Generation of UI Workflows from Tutorial Videos-
[pdf]
[bibtex]@InProceedings{Beauchaine_2026_WACV, author = {Beauchaine, Adam and Shue, Craig}, title = {See, Record, Do: Automated Generation of UI Workflows from Tutorial Videos}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6256-6265} }
VADER: Towards Causal Video Anomaly Understanding with Relation-Aware Large Language Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Cheng_2026_WACV, author = {Cheng, Ying and Lin, Yu-Ho and Chen, Min-Hung and Yang, Fu-En and Lai, Shang-Hong}, title = {VADER: Towards Causal Video Anomaly Understanding with Relation-Aware Large Language Models}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7301-7311} }
Pretraining Helps When Capacity Allows: Evidence from Ultra-Small ConvNets-
[pdf]
[supp]
[bibtex]@InProceedings{Muralidharan_2026_WACV, author = {Muralidharan, Srikanth and Medeiros, Heitor R. and Aminbeidokhti, Masih and Granger, Eric and Pedersoli, Marco}, title = {Pretraining Helps When Capacity Allows: Evidence from Ultra-Small ConvNets}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {8333-8342} }
SmoothDiffusion-VE: Real-time Generative Video Editing Using Adaptive Feature Cache-
[pdf]
[supp]
[bibtex]@InProceedings{Munir_2026_WACV, author = {Munir, Mustafa and Zalewski, Sophia and Liu, Shiqiu and Tarjan, David and Belede, Sushmitha and Patney, Anjul and Marculescu, Radu}, title = {SmoothDiffusion-VE: Real-time Generative Video Editing Using Adaptive Feature Cache}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {8468-8478} }
Leveraging Sparsity for Privacy in Collaborative Inference-
[pdf]
[supp]
[bibtex]@InProceedings{Hoefler_2026_WACV, author = {Hoefler, Maximilian Andreas and Mueller, Karsten and Samek, Wojciech}, title = {Leveraging Sparsity for Privacy in Collaborative Inference}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7596-7604} }
UltraClean: A Simple Framework to Train Robust Neural Networks against Backdoor Attacks-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhao_2026_WACV, author = {Zhao, Bingyin and Lao, Yingjie}, title = {UltraClean: A Simple Framework to Train Robust Neural Networks against Backdoor Attacks}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {8353-8363} }
QAL : A Loss for Recall-Precision Balance in 3D Reconstruction-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Meshram_2026_WACV, author = {Meshram, Pranay and Turkar, Yash and Singh, Kartikeya and Masilamani, Praveen Raj and Adhivarahan, Charuvahan and Dantu, Karthik}, title = {QAL : A Loss for Recall-Precision Balance in 3D Reconstruction}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7965-7974} }
DualRes: Production-ready Dynamic Object Detection-
[pdf]
[bibtex]@InProceedings{El_Hassani_2026_WACV, author = {El Hassani, Jibril and Verelst, Thomas}, title = {DualRes: Production-ready Dynamic Object Detection}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7842-7851} }
Meta-YOLO: Metadata-Guided Real-Time Object Detector in Aerial Imagery-
[pdf]
[supp]
[bibtex]@InProceedings{Yoon_2026_WACV, author = {Yoon, Deukryeol and Kim, Seonghak and Sung, Young Hwa and Jung, Jinho}, title = {Meta-YOLO: Metadata-Guided Real-Time Object Detector in Aerial Imagery}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7975-7984} }
Generalized Category Discovery for LiDAR Semantic Segmentation-
[pdf]
[supp]
[bibtex]@InProceedings{Kim_2026_WACV, author = {Kim, Minseok and Boo, Jiyong and Yoon, Kuk-Jin}, title = {Generalized Category Discovery for LiDAR Semantic Segmentation}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {8416-8426} }
NeuroBridge: Few-Shot Cross-Modal Neuron Re-identification via Dual-Channel Deep Metric Learning-
[pdf]
[supp]
[bibtex]@InProceedings{Li_2026_WACV, author = {Li, Wenwei and Liao, Mingwei and Cai, Lingyi and Li, Anan}, title = {NeuroBridge: Few-Shot Cross-Modal Neuron Re-identification via Dual-Channel Deep Metric Learning}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {8670-8679} }
IPTQ-ViT: Post-Training Quantization of Non-linear Functions for Integer-only Vision Transformers-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kim_2026_WACV, author = {Kim, Gihwan and Lee, Jemin and Kim, Hyungshin}, title = {IPTQ-ViT: Post-Training Quantization of Non-linear Functions for Integer-only Vision Transformers}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7366-7375} }
Denoise, Divide, Distill, and Predict (D3P): Towards Forecasting Long-horizon Real-world Anomaly from Normalcy-
[pdf]
[bibtex]@InProceedings{Merilleau_2026_WACV, author = {M\'erilleau, Quentin and Majhi, Snehashis and Dantcheva, Antitza and Kong, Quan and Garattoni, Lorenzo and Francesca, Gianpiero and Bremond, Francois}, title = {Denoise, Divide, Distill, and Predict (D3P): Towards Forecasting Long-horizon Real-world Anomaly from Normalcy}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6246-6255} }
Zero-Shot Domain Generalisation via Prompt-Driven Feature Refinement-
[pdf]
[bibtex]@InProceedings{Qiao_2026_WACV, author = {Qiao, Tingrui and Zhao, Di and Walker, Caroline and Cunningham, Chris and Koh, Yun Sing}, title = {Zero-Shot Domain Generalisation via Prompt-Driven Feature Refinement}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6184-6193} }
Generalizing Sports Feedback Generation by Watching Competitions and Reading Books: A Rock Climbing Case Study-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Rai_2026_WACV, author = {Rai, Arushi and Kovashka, Adriana}, title = {Generalizing Sports Feedback Generation by Watching Competitions and Reading Books: A Rock Climbing Case Study}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {8136-8145} }
Neural Geometry Image-Based Representations with Optimal Transport (OT)-
[pdf]
[arXiv]
[bibtex]@InProceedings{Gao_2026_WACV, author = {Gao, Xiang and Liu, Yuanpeng and Li, Jiazhi and Wang, Xinmu and Guo, Minghao and Guo, Yu and Song, Xiyun and Yu, Heather and Lao, Zhiqiang and Gu, Xianfeng David}, title = {Neural Geometry Image-Based Representations with Optimal Transport (OT)}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6676-6686} }
Multimodal Adversarial Defense for Vision-Language Models by Leveraging One-To-Many Relationships-
[pdf]
[supp]
[bibtex]@InProceedings{Waseda_2026_WACV, author = {Waseda, Futa and Tejero-de-Pablos, Antonio and Echizen, Isao}, title = {Multimodal Adversarial Defense for Vision-Language Models by Leveraging One-To-Many Relationships}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6968-6977} }
Sketch3R: Rapid and Realistic 3D VR Sketch Creation to Shape Retrieval-
[pdf]
[supp]
[bibtex]@InProceedings{Halder_2026_WACV, author = {Halder, Mritunjoy and Shukla, Shivam Ashok and Tiwari, Lokender and Mittal, Raghav and Bhowmick, Brojeshwar}, title = {Sketch3R: Rapid and Realistic 3D VR Sketch Creation to Shape Retrieval}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {8680-8689} }
MapleGrasp: Mask-guided Feature Pooling for Language-driven Efficient Robotic Grasping-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Bhat_2026_WACV, author = {Bhat, Vineet and Patel, Naman and Krishnamurthy, Prashanth and Karri, Ramesh and Khorrami, Farshad}, title = {MapleGrasp: Mask-guided Feature Pooling for Language-driven Efficient Robotic Grasping}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7554-7564} }
QUOTA: Quantifying Objects with Text-to-Image Models for Any Domain-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Sun_2026_WACV, author = {Sun, Wenfang and Du, Yingjun and Liu, Gaowen and Zheng, Yefeng and Snoek, Cees G. M.}, title = {QUOTA: Quantifying Objects with Text-to-Image Models for Any Domain}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6381-6390} }
Chain-of-Look Spatial Reasoning for Dense Surgical Instrument Counting-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Bhyri_2026_WACV, author = {Bhyri, Rishikesh and Quaranto, Brian R and Yuan, Junsong and Kim, Peter C W and Xi, Nan}, title = {Chain-of-Look Spatial Reasoning for Dense Surgical Instrument Counting}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {8521-8530} }
Towards Fine-Grained Adaptation of CLIP via a Self-Trained Alignment Score-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ali_2026_WACV, author = {Ali, Eman and Silva, Sathira and Arora, Chetan and Khan, Muhammad Haris}, title = {Towards Fine-Grained Adaptation of CLIP via a Self-Trained Alignment Score}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {5875-5885} }
GFT-GCN: Privacy-Preserving 3D Face Mesh Recognition with Spectral Diffusion-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Felouat_2026_WACV, author = {Felouat, Hichem and Wang, Hanrui and Echizen, Isao}, title = {GFT-GCN: Privacy-Preserving 3D Face Mesh Recognition with Spectral Diffusion}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6236-6245} }
Disentangle and Regularize: Sign Language Production with Articulator-Based Disentanglement and Channel-Aware Regularization-
[pdf]
[supp]
[bibtex]@InProceedings{Tasyurek_2026_WACV, author = {Ta\c{s}y\"urek, S\"umeyye Meryem and K{\i}z{\i}ltepe, Tu\u{g}\c{c}e and Keles, Hacer Yalim}, title = {Disentangle and Regularize: Sign Language Production with Articulator-Based Disentanglement and Channel-Aware Regularization}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {8458-8467} }
MIST: Multilingual Incidental Dataset for Scene Text Detection-
[pdf]
[supp]
[bibtex]@InProceedings{Mundra_2026_WACV, author = {Mundra, Saumya and Mondal, Ajoy and Jawahar, C.V.}, title = {MIST: Multilingual Incidental Dataset for Scene Text Detection}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7658-7667} }
VAST-ReID: A Low-Light Benchmark Dataset for Person Re-Identification with Visual and Attribute-Rich Semantic Tracking-
[pdf]
[supp]
[bibtex]@InProceedings{Khan_2026_WACV, author = {Khan, Hammad and Giri, Rakesh Kumar and Thakare, Kamalakar Vijay and Choi, Heeseung and Jung, Hyungjoo and Dogra, Debi Prosad and Kim, Ig-Jae}, title = {VAST-ReID: A Low-Light Benchmark Dataset for Person Re-Identification with Visual and Attribute-Rich Semantic Tracking}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {5833-5841} }
Robust Scene Coordinate Regression via Geometrically-Consistent Global Descriptors-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Nguyen_2026_WACV, author = {Nguyen, Son Tung and Fontan, Alejandro and Milford, Michael and Fischer, Tobias}, title = {Robust Scene Coordinate Regression via Geometrically-Consistent Global Descriptors}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {8209-8219} }
PointSt3R: Point Tracking through 3D Ground Correspondence-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Guerrier_2026_WACV, author = {Guerrier, Rhodri and Harley, Adam W. and Damen, Dima}, title = {PointSt3R: Point Tracking through 3D Ground Correspondence}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7430-7439} }
NoHumansRequired: Autonomous High-Quality Image Editing Triplet Mining-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kuprashevich_2026_WACV, author = {Kuprashevich, Maksim and Alekseenko, Grigorii and Tolstykh, Irina and Fedorov, Georgii and Suleimanov, Bulat and Dokholyan, Vladimir and Gordeev, Aleksandr}, title = {NoHumansRequired: Autonomous High-Quality Image Editing Triplet Mining}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6059-6068} }
DuPLUS: Dual-Prompt Vision-Language Model for Universal Medical Image Segmentation and Prognosis-
[pdf]
[supp]
[bibtex]@InProceedings{Saeed_2026_WACV, author = {Saeed, Numan and Saleem, Tausifa Jan and Maani, Fadillah and Ridzuan, Muhammad and Wang, Hu and Yaqub, Mohammad}, title = {DuPLUS: Dual-Prompt Vision-Language Model for Universal Medical Image Segmentation and Prognosis}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {8386-8395} }
Relevance-aware Multi-context Contrastive Decoding for Retrieval-augmented Visual Question Answering-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kim_2026_WACV, author = {Kim, Jongha and Ko, Byungoh and Na, Jeehye and Yoon, Jinsung and Kim, Hyunwoo J.}, title = {Relevance-aware Multi-context Contrastive Decoding for Retrieval-augmented Visual Question Answering}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {8596-8605} }
Image-Guided Semantic Pseudo-LiDAR Point Generation for 3D Object Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Lee_2026_WACV, author = {Lee, Minseung and Moon, Seokha and Lee, Seung Joon and Mahjourian, Reza and Kim, Jinkyu}, title = {Image-Guided Semantic Pseudo-LiDAR Point Generation for 3D Object Detection}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7137-7147} }
Intraoperative 2D/3D Registration via Spherical Similarity Learning and Differentiable Levenberg-Marquardt Optimization-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chen_2026_WACV, author = {Chen, Minheng and Kong, Youyong}, title = {Intraoperative 2D/3D Registration via Spherical Similarity Learning and Differentiable Levenberg-Marquardt Optimization}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7239-7249} }
Bridging the Domain Gap in Small Multimodal Models: A Dual-level Alignment Perspective-
[pdf]
[supp]
[bibtex]@InProceedings{Dayal_2026_WACV, author = {Dayal, Aveen and Divya, Peketi and Tiwari, Nidhi and Cenkeramaddi, Linga Reddy and Mohan, C Krishna and Kumar, Abhinav}, title = {Bridging the Domain Gap in Small Multimodal Models: A Dual-level Alignment Perspective}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {8262-8271} }
ChartQA-X: Generating Explanations for Visual Chart Reasoning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Hegde_2026_WACV, author = {Hegde, Shamanthak and Fazli, Pooyan and Seifi, Hasti}, title = {ChartQA-X: Generating Explanations for Visual Chart Reasoning}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6453-6463} }
RealDroneVision: Dataset and Architecture Advancements for Small-Object Drone Detection-
[pdf]
[supp]
[bibtex]@InProceedings{Sivapuram_2026_WACV, author = {Sivapuram, Arun Kumar and Peddinti, Pranav R T and Puppala, Harish and Prashanth, Komuravelli and Harsha, Jaladi Sri and Gorthi, Rama Krishna Sai}, title = {RealDroneVision: Dataset and Architecture Advancements for Small-Object Drone Detection}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6687-6695} }
brat: Aligned Multi-View Embeddings for Brain MRI Analysis-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kayser_2026_WACV, author = {Kayser, Maxime and Gridnev, Maksim and Wang, Wanting and Bain, Max and Rangnekar, Aneesh and Chatterjee, Avijit and Petrov, Aleksandr and Veeraraghavan, Harini and Swinburne, Nathaniel C.}, title = {brat: Aligned Multi-View Embeddings for Brain MRI Analysis}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {5864-5874} }
Histogram Assisted Quality Aware Generative Model for Resolution Invariant NIR Image Colorization-
[pdf]
[arXiv]
[bibtex]@InProceedings{Attri_2026_WACV, author = {Attri, Abhinav and Dwivedi, Rajeev Ranjan and Das, Samiran and Kurmi, Vinod Kumar}, title = {Histogram Assisted Quality Aware Generative Model for Resolution Invariant NIR Image Colorization}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6422-6431} }
Fetal and Neonatal Cortical Surface Reconstruction with Anatomical Normal-guidance and Perceptual Enhancements-
[pdf]
[bibtex]@InProceedings{Lee_2026_WACV, author = {Lee, Jiyang and Bae, Woori and Ji, U-Geun and Yang, Hanyeol and Lee, Jong-Min}, title = {Fetal and Neonatal Cortical Surface Reconstruction with Anatomical Normal-guidance and Perceptual Enhancements}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7759-7768} }
TriaGS: Differentiable Triangulation-Guided Geometric Consistency for 3D Gaussian Splatting-
[pdf]
[arXiv]
[bibtex]@InProceedings{Tran_2026_WACV, author = {Tran, Quan and Dang, Tuan}, title = {TriaGS: Differentiable Triangulation-Guided Geometric Consistency for 3D Gaussian Splatting}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {8396-8405} }
PALMS+: Modular Image-Based Floor Plan Localization Leveraging Depth Foundation Model-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Cheng_2026_WACV, author = {Cheng, Yunqian and Princen, Benjamin and Manduchi, Roberto}, title = {PALMS+: Modular Image-Based Floor Plan Localization Leveraging Depth Foundation Model}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7084-7093} }
Advancing Player Identification and Tracking with Global ID Fusion (GIF)-
[pdf]
[supp]
[bibtex]@InProceedings{Wojtulewicz_2026_WACV, author = {Wojtulewicz, Karol and Liu, Minxing and Carlsson, Niklas}, title = {Advancing Player Identification and Tracking with Global ID Fusion (GIF)}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {7269-7280} }
VRAgent: Self-Refining Agent for Zero-Shot Multimodal Video Retrieval-
[pdf]
[supp]
[bibtex]@InProceedings{Shah_2026_WACV, author = {Shah, Ketul and Nathani, Pankaj and Chellappa, Rama and Heilbron, Fabian Caba}, title = {VRAgent: Self-Refining Agent for Zero-Shot Multimodal Video Retrieval}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {8157-8167} }
Alignment and Distillation: A Robust Framework for Multimodal Domain Generalizable Human Action Recognition-
[pdf]
[bibtex]@InProceedings{Ji_2026_WACV, author = {Ji, Hyeonbin and Lee, Juyeob and Park, Eunil}, title = {Alignment and Distillation: A Robust Framework for Multimodal Domain Generalizable Human Action Recognition}, booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)}, month = {March}, year = {2026}, pages = {6913-6924} }
Correcting and Quantifying Systematic Errors in 3D Box Annotations for Autonomous Driving-
[pdf]
[arXiv]
[bibtex]
@comment{WACV 2026 entry. Braced acronyms in title and booktitle keep their capitalisation under sentence-casing styles.}
@InProceedings{Miro_2026_WACV,
  author    = {Miro, Alexandre Justo and af Klinteberg, Ludvig and Timus, Bogdan and Asefaw, Aron and Khoche, Ajinkya and Gustafsson, Thomas and Mansouri, Sina Sharif and Daneshtalab, Masoud},
  title     = {Correcting and Quantifying Systematic Errors in {3D} Box Annotations for Autonomous Driving},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {6724--6732},
}
CaFlow: Enhancing Long-Term Action Quality Assessment with Causal Counterfactual Flow-
[pdf]
[supp]
[arXiv]
[bibtex]
@comment{WACV 2026 entry. The key carries a title keyword because the plain Han_2026_WACV key is already used by an earlier entry in this file (the ATM paper), and BibTeX rejects repeated keys. Braced words in title and booktitle keep their capitalisation under sentence-casing styles.}
@InProceedings{Han_2026_WACV_CaFlow,
  author    = {Han, Ruisheng and Zhou, Kanglei and Chen, Shuang and Atapour-Abarghouei, Amir and Shum, Hubert P. H.},
  title     = {{CaFlow}: Enhancing Long-Term Action Quality Assessment with Causal Counterfactual Flow},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {8231--8241},
}
Learning Beyond Labels: Self-Supervised Handwritten Text Recognition-
[pdf]
[supp]
[bibtex]
@comment{WACV 2026 entry. Initials in the last author name are space-separated so BibTeX parses them as two given-name tokens. Braced acronyms in booktitle keep their capitalisation if a style recases the field.}
@InProceedings{Mitra_2026_WACV,
  author    = {Mitra, Shree and Mondal, Ajoy and Jawahar, C. V.},
  title     = {Learning Beyond Labels: Self-Supervised Handwritten Text Recognition},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {6653--6663},
}
KMOPS: Keypoint-Driven Method for Multi-Object Pose and Metric Size Estimation from Stereo Images-
[pdf]
[supp]
[bibtex]
@comment{WACV 2026 entry. Braced acronyms in title and booktitle keep their capitalisation under sentence-casing styles.}
@InProceedings{Wu_2026_WACV,
  author    = {Wu, Ying-Kun and Shen, Yi and Huang, Tzuhsuan and Fang, I-Sheng and Chen, Jun-Cheng},
  title     = {{KMOPS}: Keypoint-Driven Method for Multi-Object Pose and Metric Size Estimation from Stereo Images},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {7730--7739},
}
Isolating the Role of Temporal Information in Video Saliency: A Controlled Experimental Analysis-
[pdf]
[supp]
[bibtex]
@comment{WACV 2026 entry. Braced acronyms in booktitle keep their capitalisation if a style recases the field.}
@InProceedings{El-Jiz_2026_WACV,
  author    = {El-Jiz, Peter and Kuemmerer, Matthias and Tangemann, Matthias and Bethge, Matthias and Bartels, Andreas and Bannert, Michael Mario},
  title     = {Isolating the Role of Temporal Information in Video Saliency: A Controlled Experimental Analysis},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {5909--5918},
}
ScoreNet: Netting Lightweight Quality Scores for Better Visual Assessment with Large Multi-Modality Models-
[pdf]
[supp]
[bibtex]
@comment{WACV 2026 entry. Braced words in title and booktitle keep their capitalisation under sentence-casing styles.}
@InProceedings{Rashidi_2026_WACV,
  author    = {Rashidi, Bahador and Aghakasiri, Kiarash and Zhang, Shupei and Sattarifard, Amirmohsen and Zhang, Yue and Gao, Chao},
  title     = {{ScoreNet}: Netting Lightweight Quality Scores for Better Visual Assessment with Large Multi-Modality Models},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {7008--7018},
}
Digital Forensic AI You Can Explain: A Case Study on Video Source Camera Identification-
[pdf]
[bibtex]
@comment{WACV 2026 entry. Braced acronyms in title and booktitle keep their capitalisation under sentence-casing styles.}
@InProceedings{Veksler_2026_WACV,
  author    = {Veksler, Maryna and Akkaya, Kemal and Uluagac, Selcuk},
  title     = {Digital Forensic {AI} You Can Explain: A Case Study on Video Source Camera Identification},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {7030--7039},
}
CoreCaption: Core Caption based Text-to-Video Retrieval-
[pdf]
[supp]
[bibtex]
@comment{WACV 2026 entry. Braced words in title and booktitle keep their capitalisation under sentence-casing styles.}
@InProceedings{Jang_2026_WACV,
  author    = {Jang, Junkyu},
  title     = {{CoreCaption}: Core Caption based Text-to-Video Retrieval},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {6600--6610},
}
Semantic Map Guided Bird's-Eye View Learning for Online HD Map Construction-
[pdf]
[bibtex]
@comment{WACV 2026 entry. Braced acronyms in title and booktitle keep their capitalisation under sentence-casing styles.}
@InProceedings{Ren_2026_WACV,
  author    = {Ren, Huantao and Eraqi, Hesham M. and Musa, ABM and Moustafa, Mohamed},
  title     = {Semantic Map Guided Bird's-Eye View Learning for Online {HD} Map Construction},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {7852--7861},
}
Enhancing Monocular 3D Hand Reconstruction with Learned Texture Priors-
[pdf]
[supp]
[arXiv]
[bibtex]
@comment{WACV 2026 entry. Braced acronyms in title and booktitle keep their capitalisation under sentence-casing styles.}
@InProceedings{Karvounas_2026_WACV,
  author    = {Karvounas, Giorgos and Kyriazis, Nikolaos and Oikonomidis, Iason and Pavlakos, Georgios and Argyros, Antonis A.},
  title     = {Enhancing Monocular {3D} Hand Reconstruction with Learned Texture Priors},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {7073--7083},
}
ACuRE: Accurate Continuity-Regularized SpO2 Estimation Using Liquid Time-Constant Networks-
[pdf]
[supp]
[bibtex]
@comment{WACV 2026 entry. Braced words in title and booktitle keep their capitalisation under sentence-casing styles.}
@InProceedings{Ahmad_2026_WACV,
  author    = {Ahmad, Shahzad and Mishra, Divya and Bano, Sania and Chanda, Sukalpa and Rawat, Yogesh Singh},
  title     = {{ACuRE}: Accurate Continuity-Regularized {SpO2} Estimation Using Liquid Time-Constant Networks},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {7250--7259},
}
SceneShine: Illumination-aware Human Scene Gaussian Re-Splatting from Mobile Device Video-
[pdf]
[supp]
[bibtex]
@comment{WACV 2026 entry. The key carries a title keyword because the plain Ren_2026_WACV key is already used by an earlier entry in this file (the Semantic Map Guided paper), and BibTeX rejects repeated keys. Braced words in title and booktitle keep their capitalisation under sentence-casing styles.}
@InProceedings{Ren_2026_WACV_SceneShine,
  author    = {Ren, Xuqian and Wang, Wenjia and Nguyen, Mai Ngoc and Kannala, Juho and Rahtu, Esa},
  title     = {{SceneShine}: Illumination-aware Human Scene {Gaussian} Re-Splatting from Mobile Device Video},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {8302--8312},
}
T2VWorldBench: A Benchmark for Evaluating World Knowledge in Text-to-Video Generation-
[pdf]
[supp]
[arXiv]
[bibtex]
@comment{WACV 2026 entry. Braced words in title and booktitle keep their capitalisation under sentence-casing styles.}
@InProceedings{Chen_2026_WACV,
  author    = {Chen, Yubin and Guo, Xuyang and Shi, Zhenmei and Song, Zhao and Zhang, Jiahao},
  title     = {{T2VWorldBench}: A Benchmark for Evaluating World Knowledge in Text-to-Video Generation},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {6474--6485},
}
Back
