WACV 2026 Open Access Repository

Papers

Back
ATM: Enhanced Alignment for Text-to-Motion Generation: Ke Han,

Yueming Lyu,

Weichen Yu,

Nicu Sebe; [pdf] [supp]
[bibtex]
@inproceedings{Han_2026_WACV,
  author    = {Han, Ke and Lyu, Yueming and Yu, Weichen and Sebe, Nicu},
  title     = {ATM: Enhanced Alignment for Text-to-Motion Generation},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = {March},
  year      = {2026},
  pages     = {6862-6872}
}
GFT: Graph Feature Tuning for Efficient Point Cloud Analysis: Manish Dhakal,

Venkat R Dasari,

Rajshekhar Sunderraman,

Yi Ding; [pdf] [supp] [arXiv]
[bibtex]
@inproceedings{Dhakal_2026_WACV,
  author    = {Dhakal, Manish and Dasari, Venkat R and Sunderraman, Rajshekhar and Ding, Yi},
  title     = {GFT: Graph Feature Tuning for Efficient Point Cloud Analysis},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = {March},
  year      = {2026},
  pages     = {7955-7964}
}
FG-TRACER: Tracing Information Flow in Multimodal Large Language Models in Free-Form Generation: Alessia Saporita,

Vittorio Pipoli,

Federico Bolelli,

Lorenzo Baraldi,

Andrea Acquaviva,

Elisa Ficarra; [pdf] [supp]
[bibtex]
@inproceedings{Saporita_2026_WACV,
  author    = {Saporita, Alessia and Pipoli, Vittorio and Bolelli, Federico and Baraldi, Lorenzo and Acquaviva, Andrea and Ficarra, Elisa},
  title     = {FG-TRACER: Tracing Information Flow in Multimodal Large Language Models in Free-Form Generation},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = {March},
  year      = {2026},
  pages     = {7903-7912}
}
CAST: Evaluating Multi-Object Trackers with Context-Aware Switch and Transfer Scores: Jin Bai,

Gregory D. Hager; [pdf]
[bibtex]
@inproceedings{Bai_2026_WACV,
  author    = {Bai, Jin and Hager, Gregory D.},
  title     = {CAST: Evaluating Multi-Object Trackers with Context-Aware Switch and Transfer Scores},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = {March},
  year      = {2026},
  pages     = {7260-7268}
}
NavMapFusion: Diffusion-based Fusion of Navigation Maps for Online Vectorized HD Map Construction: Thomas Monninger,

Zihan Zhang,

Steffen Staab,

Sihao Ding; [pdf] [arXiv]
[bibtex]
@inproceedings{Monninger_2026_WACV,
  author    = {Monninger, Thomas and Zhang, Zihan and Staab, Steffen and Ding, Sihao},
  title     = {NavMapFusion: Diffusion-based Fusion of Navigation Maps for Online Vectorized HD Map Construction},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = {March},
  year      = {2026},
  pages     = {7945-7954}
}
DREAM: Dynamic Prompts and GuidedMix for Efficient Continual Adaptation of Visual-Language Models: Evelyn Chee,

Mong Li Lee,

Wynne Hsu; [pdf]
[bibtex]
@inproceedings{Chee_2026_WACV,
  author    = {Chee, Evelyn and Lee, Mong Li and Hsu, Wynne},
  title     = {DREAM: Dynamic Prompts and GuidedMix for Efficient Continual Adaptation of Visual-Language Models},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = {March},
  year      = {2026},
  pages     = {5853-5863}
}
Overcoming Small Data Limitations in Video-Based Infant Respiration Estimation: Liyang Song,

Hardik Bishnoi,

Sai Kumar Reddy Manne,

Sarah Ostadabbas,

Briana J. Taylor,

Michael Wan; [pdf] [supp] [arXiv]
[bibtex]
@inproceedings{Song_2026_WACV,
  author    = {Song, Liyang and Bishnoi, Hardik and Manne, Sai Kumar Reddy and Ostadabbas, Sarah and Taylor, Briana J. and Wan, Michael},
  title     = {Overcoming Small Data Limitations in Video-Based Infant Respiration Estimation},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = {March},
  year      = {2026},
  pages     = {6340-6349}
}
Distribution Highlighted Reference-based Label Distribution Learning for Facial Age Estimation: Satoshi Suzuki,

Shin'ya Yamaguchi,

Shoichiro Takeda,

Takuhiro Kaneko,

Shota Orihashi,

Ryo Masumura; [pdf] [supp]
[bibtex]
@inproceedings{Suzuki_2026_WACV,
  author    = {Suzuki, Satoshi and Yamaguchi, Shin'ya and Takeda, Shoichiro and Kaneko, Takuhiro and Orihashi, Shota and Masumura, Ryo},
  title     = {Distribution Highlighted Reference-based Label Distribution Learning for Facial Age Estimation},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = {March},
  year      = {2026},
  pages     = {6464-6473}
}
IMKD: Intensity-Aware Multi-Level Knowledge Distillation for Camera-Radar Fusion: Shashank Mishra,

Karan Patil,

Didier Stricker,

Jason Rambach; [pdf] [supp] [arXiv]
[bibtex]
@inproceedings{Mishra_2026_WACV,
  author    = {Mishra, Shashank and Patil, Karan and Stricker, Didier and Rambach, Jason},
  title     = {IMKD: Intensity-Aware Multi-Level Knowledge Distillation for Camera-Radar Fusion},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = {March},
  year      = {2026},
  pages     = {6027-6038}
}
Leveraging Semantic Attribute Binding for Free-Lunch Color Control in Diffusion Models: Héctor Laria,

Alexandra Gomez-Villa,

Jiang Qin,

Muhammad Atif Butt,

Bogdan Raducanu,

Javier Vazquez-Corral,

Joost van de Weijer,

Kai Wang; [pdf] [supp]
[bibtex]
@comment{The accented letter in the first author's given name is wrapped in its own brace group so BibTeX treats it as a single special character when sorting and building labels.}
@inproceedings{Laria_2026_WACV,
  author    = {Laria, H{\'e}ctor and Gomez-Villa, Alexandra and Qin, Jiang and Butt, Muhammad Atif and Raducanu, Bogdan and Vazquez-Corral, Javier and van de Weijer, Joost and Wang, Kai},
  title     = {Leveraging Semantic Attribute Binding for Free-Lunch Color Control in Diffusion Models},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = {March},
  year      = {2026},
  pages     = {7689-7698}
}
ForestSplats: Deformable Transient Field for Gaussian Splatting in the Wild: Wongi Park,

Myeongseok Nam,

Siwon Kim,

Sangwoo Jo,

Soomok Lee; [pdf] [supp] [arXiv]
[bibtex]
@inproceedings{Park_2026_WACV,
  author    = {Park, Wongi and Nam, Myeongseok and Kim, Siwon and Jo, Sangwoo and Lee, Soomok},
  title     = {ForestSplats: Deformable Transient Field for Gaussian Splatting in the Wild},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = {March},
  year      = {2026},
  pages     = {6978-6987}
}
3D Cell Oversegmentation Correction via Geo-Wasserstein Divergence: Peter Chen,

Bryan Chang,

Olivia A Creasey,

Julie Beth Sneddon,

Zev J Gartner,

Yining Liu; [pdf] [supp] [arXiv]
[bibtex]
@comment{Third author corrected to surname Creasey with given names Olivia A; the exported form placed the middle initial in the surname position.}
@inproceedings{Chen_2026_WACV,
  author    = {Chen, Peter and Chang, Bryan and Creasey, Olivia A and Sneddon, Julie Beth and Gartner, Zev J and Liu, Yining},
  title     = {3D Cell Oversegmentation Correction via Geo-Wasserstein Divergence},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = {March},
  year      = {2026},
  pages     = {7534-7543}
}
STRinGS: Selective Text Refinement in Gaussian Splatting: Abhinav Raundhal,

Gaurav Behera,

P. J. Narayanan,

Ravi Kiran Sarvadevabhatla,

Makarand Tapaswi; [pdf] [supp] [arXiv]
[bibtex]
@inproceedings{Raundhal_2026_WACV,
  author    = {Raundhal, Abhinav and Behera, Gaurav and Narayanan, P. J. and Sarvadevabhatla, Ravi Kiran and Tapaswi, Makarand},
  title     = {STRinGS: Selective Text Refinement in Gaussian Splatting},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = {March},
  year      = {2026},
  pages     = {8574-8583}
}
SceneEdited: A City-Scale Benchmark for 3D HD Map Updating via Image-Guided Change Detection: Chun-Jung Lin,

Tat-Jun Chin,

Sourav Garg,

Feras Dayoub; [pdf] [supp] [arXiv]
[bibtex]
@inproceedings{Lin_2026_WACV,
  author    = {Lin, Chun-Jung and Chin, Tat-Jun and Garg, Sourav and Dayoub, Feras},
  title     = {SceneEdited: A City-Scale Benchmark for 3D HD Map Updating via Image-Guided Change Detection},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = {March},
  year      = {2026},
  pages     = {6330-6339}
}
START: Spatial and Textual Learning for Chart Understanding: Zhuoming Liu,

Xiaofeng Gao,

Feiyang Niu,

Qiaozi Gao,

Liu Liu,

Robinson Piramuthu; [pdf] [supp] [arXiv]
[bibtex]
@inproceedings{Liu_2026_WACV,
  author    = {Liu, Zhuoming and Gao, Xiaofeng and Niu, Feiyang and Gao, Qiaozi and Liu, Liu and Piramuthu, Robinson},
  title     = {START: Spatial and Textual Learning for Chart Understanding},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = {March},
  year      = {2026},
  pages     = {8146-8156}
}
Adversarial Pseudo-replay for Exemplar-free Class-incremental Learning: Hiroto Honda; [pdf] [supp] [arXiv]
[bibtex]
@inproceedings{Honda_2026_WACV,
  author    = {Honda, Hiroto},
  title     = {Adversarial Pseudo-replay for Exemplar-free Class-incremental Learning},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = {March},
  year      = {2026},
  pages     = {7493-7502}
}
AugMapNet: Improving Spatial Latent Structure via BEV Grid Augmentation for Enhanced Vectorized Online HD Map Construction: Thomas Monninger,

Md Zafar Anwar,

Stanislaw Antol,

Steffen Staab,

Sihao Ding; [pdf] [supp] [arXiv]
[bibtex]
@comment{Key disambiguated with a title keyword: Monninger_2026_WACV is already used by the NavMapFusion entry earlier in this file, and BibTeX rejects a repeated key, so this AugMapNet entry was previously unreachable.}
@inproceedings{Monninger_2026_WACV_AugMapNet,
  author    = {Monninger, Thomas and Anwar, Md Zafar and Antol, Stanislaw and Staab, Steffen and Ding, Sihao},
  title     = {AugMapNet: Improving Spatial Latent Structure via BEV Grid Augmentation for Enhanced Vectorized Online HD Map Construction},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = {March},
  year      = {2026},
  pages     = {8541-8550}
}
Mem-MLP: Real-Time 3D Human Motion Generation from Sparse Inputs: Sinan Mutlu,

Georgios F. Angelis,

Savas Ozkan,

Paul Wisbey,

Anastasios Drosou,

Mete Ozay; [pdf] [supp] [arXiv]
[bibtex]
@inproceedings{Mutlu_2026_WACV,
  author    = {Mutlu, Sinan and Angelis, Georgios F. and Ozkan, Savas and Wisbey, Paul and Drosou, Anastasios and Ozay, Mete},
  title     = {Mem-MLP: Real-Time 3D Human Motion Generation from Sparse Inputs},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = {March},
  year      = {2026},
  pages     = {8343-8352}
}
SurgXBench: Explainable Vision-Language Model Benchmark for Surgery: Jiajun Cheng,

Xianwu Zhao,

Sainan Liu,

Xiaofan Yu,

Ravi Prakash,

Patrick J. Codd,

Jonathan Elliott Katz,

Shan Lin; [pdf] [supp] [arXiv]
[bibtex]
@inproceedings{Cheng_2026_WACV,
  author    = {Cheng, Jiajun and Zhao, Xianwu and Liu, Sainan and Yu, Xiaofan and Prakash, Ravi and Codd, Patrick J. and Katz, Jonathan Elliott and Lin, Shan},
  title     = {SurgXBench: Explainable Vision-Language Model Benchmark for Surgery},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = {March},
  year      = {2026},
  pages     = {8188-8198}
}
CanKD: Cross-Attention-based Non-local Operation for Feature-based Knowledge Distillation: Shizhe Sun,

Wataru Ohyama; [pdf] [supp] [arXiv]
[bibtex]
@inproceedings{Sun_2026_WACV,
  author    = {Sun, Shizhe and Ohyama, Wataru},
  title     = {CanKD: Cross-Attention-based Non-local Operation for Feature-based Knowledge Distillation},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = {March},
  year      = {2026},
  pages     = {8606-8616}
}
UniTabBank: A Large Scale Multi-Lingual, Multi-Layout, Multi-Type, Multi-Format Dataset for Table Detection: Ajoy Mondal,

Saumya Mundra,

Avijit Dasgupta,

C.V. Jawahar; [pdf] [supp]
[bibtex]
@comment{The last author's initials are separated by a space so BibTeX parses them as two given-name tokens instead of one glued token.}
@inproceedings{Mondal_2026_WACV,
  author    = {Mondal, Ajoy and Mundra, Saumya and Dasgupta, Avijit and Jawahar, C. V.},
  title     = {UniTabBank: A Large Scale Multi-Lingual, Multi-Layout, Multi-Type, Multi-Format Dataset for Table Detection},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = {March},
  year      = {2026},
  pages     = {6486-6495}
}
Being Positive about Negative Queries: Exclusion Aware Multimodal Retrieval using Disentangled Representations: Prachi Jha,

Sumit Bhatia,

Srikanta Bedathur; [pdf]
[bibtex]
@inproceedings{Jha_2026_WACV,
  author    = {Jha, Prachi and Bhatia, Sumit and Bedathur, Srikanta},
  title     = {Being Positive about Negative Queries: Exclusion Aware Multimodal Retrieval using Disentangled Representations},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = {March},
  year      = {2026},
  pages     = {7832-7841}
}
CORA: Consistency-Guided Semi-Supervised Framework for Reasoning Segmentation: Prantik Howlader,

Hoang Nguyen-Canh,

Srijan Das,

Jingyi Xu,

Hieu Le,

Dimitris Samaras; [pdf] [supp]
[bibtex]
@inproceedings{Howlader_2026_WACV,
  author    = {Howlader, Prantik and Nguyen-Canh, Hoang and Das, Srijan and Xu, Jingyi and Le, Hieu and Samaras, Dimitris},
  title     = {CORA: Consistency-Guided Semi-Supervised Framework for Reasoning Segmentation},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = {March},
  year      = {2026},
  pages     = {5934-5944}
}
Point2Pose: A Generative Framework for 3D Human Pose Estimation with Multi-View Point Cloud Dataset: Hyunsoo Lee,

Daeum Jeon,

Hyeokjae Oh; [pdf] [supp] [arXiv]
[bibtex]
@inproceedings{Lee_2026_WACV,
  author    = {Lee, Hyunsoo and Jeon, Daeum and Oh, Hyeokjae},
  title     = {Point2Pose: A Generative Framework for 3D Human Pose Estimation with Multi-View Point Cloud Dataset},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = {March},
  year      = {2026},
  pages     = {6744-6753}
}
GDoFS: Gaussian DoF Separation for Plausible 3D Geometry in Sparse-View 3DGS: Yongsung Kim,

Jooyoung Choi,

Sungroh Yoon; [pdf] [supp]
[bibtex]
@inproceedings{Kim_2026_WACV,
  author    = {Kim, Yongsung and Choi, Jooyoung and Yoon, Sungroh},
  title     = {GDoFS: Gaussian DoF Separation for Plausible 3D Geometry in Sparse-View 3DGS},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = {March},
  year      = {2026},
  pages     = {6643-6652}
}
Distilling Offline Action Detection Models into Real-Time Streaming Models: Deep Patel,

Yasunori Babazaki,

Yasuto Nagase,

Iain Melvin,

Martin Renqiang Min; [pdf]
[bibtex]
@inproceedings{Patel_2026_WACV,
  author    = {Patel, Deep and Babazaki, Yasunori and Nagase, Yasuto and Melvin, Iain and Min, Martin Renqiang},
  title     = {Distilling Offline Action Detection Models into Real-Time Streaming Models},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = {March},
  year      = {2026},
  pages     = {6205-6214}
}
Remote Sensing Forestry Similarity Convolution: Shikuan Wang,

Yuangong Chen,

Jianzhou Gong,

Lingyi Meng,

Mengquan Wu,

Longxing Liu,

Haiwei Yuan,

Mingbin Guo; [pdf]
[bibtex]
@inproceedings{Wang_2026_WACV,
  author    = {Wang, Shikuan and Chen, Yuangong and Gong, Jianzhou and Meng, Lingyi and Wu, Mengquan and Liu, Longxing and Yuan, Haiwei and Guo, Mingbin},
  title     = {Remote Sensing Forestry Similarity Convolution},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = {March},
  year      = {2026},
  pages     = {7565-7575}
}
Multimodal Graph Representation Learning over Arbitrary Sets of Modalities: Santosh Patapati,

Trisanth Srinivasan; [pdf] [supp]
[bibtex]
@inproceedings{Patapati_2026_WACV,
  author    = {Patapati, Santosh and Srinivasan, Trisanth},
  title     = {Multimodal Graph Representation Learning over Arbitrary Sets of Modalities},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = {March},
  year      = {2026},
  pages     = {7104-7115}
}
Uncertainty-Aware Vision-Language Segmentation for Medical Imaging: Aryan Das,

Tanishq Rachamalla,

Koushik Biswas,

Swalpa Kumar Roy,

Vinay Kumar Verma; [pdf] [supp] [arXiv]
[bibtex]
@inproceedings{Das_2026_WACV,
  author    = {Das, Aryan and Rachamalla, Tanishq and Biswas, Koushik and Roy, Swalpa Kumar and Verma, Vinay Kumar},
  title     = {Uncertainty-Aware Vision-Language Segmentation for Medical Imaging},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = {March},
  year      = {2026},
  pages     = {8490-8499}
}
SeqFeedNet: Sequential Feature Feedback Network for Background Subtraction: Yu-Shun Huang,

Jing-Ming Guo,

Yi-Xiang Yang; [pdf] [supp]
[bibtex]
@inproceedings{Huang_2026_WACV,
  author    = {Huang, Yu-Shun and Guo, Jing-Ming and Yang, Yi-Xiang},
  title     = {SeqFeedNet: Sequential Feature Feedback Network for Background Subtraction},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = {March},
  year      = {2026},
  pages     = {8199-8208}
}
Crash2DocAI: Automated Integration of Post-Crash Car Part Images into Technical Reports: Vaclav Divis,

Jessica Giovagnola,

Khalil Ben Chikha,

Marek Hrúz; [pdf]
[bibtex]
@comment{The accented letter in the last author's surname is wrapped in its own brace group so BibTeX treats it as a single special character when sorting and building labels.}
@inproceedings{Divis_2026_WACV,
  author    = {Divis, Vaclav and Giovagnola, Jessica and Ben Chikha, Khalil and Hr{\'u}z, Marek},
  title     = {Crash2DocAI: Automated Integration of Post-Crash Car Part Images into Technical Reports},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = {March},
  year      = {2026},
  pages     = {8272-8281}
}
From Prompt to Production: Automating Brand-Safe Marketing Imagery with Text-to-Image Models: Parmida Atighehchian,

Henry Wang,

Andrei Kapustin,

Boris Lerner,

Tiancheng Jiang,

Taylor Jensen,

Negin Sokhandan; [pdf] [supp]
[bibtex]
@inproceedings{Atighehchian_2026_WACV,
  author    = {Atighehchian, Parmida and Wang, Henry and Kapustin, Andrei and Lerner, Boris and Jiang, Tiancheng and Jensen, Taylor and Sokhandan, Negin},
  title     = {From Prompt to Production: Automating Brand-Safe Marketing Imagery with Text-to-Image Models},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = {March},
  year      = {2026},
  pages     = {6818-6826}
}
MaxInfo: A Training-Free Key-Frame Selection Method Using Maximum Volume for Enhanced Video Understanding: Pengyi Li,

Irina Abdullaeva,

Alexander Gambashidze,

Andrey Kuznetsov,

Ivan Oseledets; [pdf] [supp] [arXiv]
[bibtex]
@inproceedings{Li_2026_WACV,
  author    = {Li, Pengyi and Abdullaeva, Irina and Gambashidze, Alexander and Kuznetsov, Andrey and Oseledets, Ivan},
  title     = {MaxInfo: A Training-Free Key-Frame Selection Method Using Maximum Volume for Enhanced Video Understanding},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = {March},
  year      = {2026},
  pages     = {7198-7207}
}
SDT-6D: Fully Sparse Depth-Transformer for Staged End-to-End 6D Pose Estimation in Industrial Multi-View Bin Picking: Nico Leuze,

Maximilian Hoh,

Samed Doğan,

Nicolas R.-Peña,

Alfred Schoettl; [pdf]
[bibtex]
@comment{Accented letters in the third and fourth authors' surnames are each wrapped in their own brace group so BibTeX treats them as single special characters when sorting and building labels.}
@inproceedings{Leuze_2026_WACV,
  author    = {Leuze, Nico and Hoh, Maximilian and Do{\u{g}}an, Samed and R.-Pe{\~n}a, Nicolas and Schoettl, Alfred},
  title     = {SDT-6D: Fully Sparse Depth-Transformer for Staged End-to-End 6D Pose Estimation in Industrial Multi-View Bin Picking},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = {March},
  year      = {2026},
  pages     = {8406-8415}
}
VideoSketcher: A Training-Free Approach for Coherent Video Sketch Transfer: Huining Li,

Bangzhen Liu,

Rui Yang,

Yang Zhou,

Chenshu Xu,

Xufang Pang,

Shengfeng He; [pdf] [supp]
[bibtex]
@comment{Key disambiguated with a title keyword: Li_2026_WACV is already used by the MaxInfo entry earlier in this file, and BibTeX rejects a repeated key, so this VideoSketcher entry was previously unreachable.}
@inproceedings{Li_2026_WACV_VideoSketcher,
  author    = {Li, Huining and Liu, Bangzhen and Yang, Rui and Zhou, Yang and Xu, Chenshu and Pang, Xufang and He, Shengfeng},
  title     = {VideoSketcher: A Training-Free Approach for Coherent Video Sketch Transfer},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = {March},
  year      = {2026},
  pages     = {7333-7343}
}
From Darkness to Detail: Frequency-Aware SSMs for Low-Light Vision: Eashan Adhikarla,

Kai Zhang,

Gong Chen,

John Nicholson,

Brian D. Davison; [pdf] [supp] [arXiv]
[bibtex]
@inproceedings{Adhikarla_2026_WACV,
  author    = {Adhikarla, Eashan and Zhang, Kai and Chen, Gong and Nicholson, John and Davison, Brian D.},
  title     = {From Darkness to Detail: Frequency-Aware SSMs for Low-Light Vision},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = {March},
  year      = {2026},
  pages     = {6956-6967}
}
Mean-Shift Distillation for Diffusion Mode Seeking: Vikas Thamizharasan,

Nikitas Chatzis,

Iliyan Georgiev,

Matthew Fisher,

Evangelos Kalogerakis,

Difan Liu,

Nanxuan Zhao,

Michal Lukáč; [pdf] [supp] [arXiv]
[bibtex]
@comment{Both accented letters in the last author's surname are each wrapped in their own brace group so BibTeX treats them as single special characters when sorting and building labels.}
@inproceedings{Thamizharasan_2026_WACV,
  author    = {Thamizharasan, Vikas and Chatzis, Nikitas and Georgiev, Iliyan and Fisher, Matthew and Kalogerakis, Evangelos and Liu, Difan and Zhao, Nanxuan and Luk{\'a}{\v{c}}, Michal},
  title     = {Mean-Shift Distillation for Diffusion Mode Seeking},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = {March},
  year      = {2026},
  pages     = {6537-6546}
}
ISALux: Illumination and Semantics-Aware Transformer Employing Mixture of Experts for Low Light Image Enhancement: Raul Balmez,

Alexandru Brateanu,

Ciprian Orhei,

Codruta O. Ancuti,

Cosmin Ancuti; [pdf] [supp]
[bibtex]
@inproceedings{Balmez_2026_WACV,
  author    = {Balmez, Raul and Brateanu, Alexandru and Orhei, Ciprian and Ancuti, Codruta O. and Ancuti, Cosmin},
  title     = {ISALux: Illumination and Semantics-Aware Transformer Employing Mixture of Experts for Low Light Image Enhancement},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = {March},
  year      = {2026},
  pages     = {7862-7872}
}
SVS-GAN for Semantic Synthesis of Traffic Videos for Autonomous Driving: Khaled M. Seyam,

Julian Wiederer,

Markus Braun,

Bin Yang; [pdf] [supp]
[bibtex]
@inproceedings{Seyam_2026_WACV,
  author    = {Seyam, Khaled M. and Wiederer, Julian and Braun, Markus and Yang, Bin},
  title     = {SVS-GAN for Semantic Synthesis of Traffic Videos for Autonomous Driving},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = {March},
  year      = {2026},
  pages     = {8650-8659}
}
Memoire: Learning User Personas from Gallery Tags for Personalized Photo Curation: Praful Mathur,

Mohsin Iftekhar,

Aman Sharma,

Sarvesh Tiwari,

Meghali Deka,

Sathish Cherukuri,

K Roopa Sheshadri,

Rakesh Valusa; [pdf] [supp]
[bibtex]
@inproceedings{Mathur_2026_WACV,
  author    = {Mathur, Praful and Iftekhar, Mohsin and Sharma, Aman and Tiwari, Sarvesh and Deka, Meghali and Cherukuri, Sathish and Sheshadri, K Roopa and Valusa, Rakesh},
  title     = {Memoire: Learning User Personas from Gallery Tags for Personalized Photo Curation},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = {March},
  year      = {2026},
  pages     = {6873-6882}
}
Boosting Unsupervised Video Instance Segmentation with Automatic Quality-Guided Self-Training: Kaixuan Lu,

Mehmet Onurcan Kaya,

Dim P. Papadopoulos; [pdf] [supp] [arXiv]
[bibtex]
@inproceedings{Lu_2026_WACV,
  author    = {Lu, Kaixuan and Kaya, Mehmet Onurcan and Papadopoulos, Dim P.},
  title     = {Boosting Unsupervised Video Instance Segmentation with Automatic Quality-Guided Self-Training},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = {March},
  year      = {2026},
  pages     = {7387-7397}
}
Test Time Adaptation Using Adaptive Quantile Recalibration: Paria Mehrbod,

Pedro Vianna,

Geraldin Nanfack,

Guy Wolf,

Eugene Belilovsky; [pdf] [supp] [arXiv]
[bibtex]
@inproceedings{Mehrbod_2026_WACV,
  author    = {Mehrbod, Paria and Vianna, Pedro and Nanfack, Geraldin and Wolf, Guy and Belilovsky, Eugene},
  title     = {Test Time Adaptation Using Adaptive Quantile Recalibration},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = {March},
  year      = {2026},
  pages     = {5986-5995}
}
SceneEval: Evaluating Semantic Coherence in Text-Conditioned 3D Indoor Scene Synthesis: Hou In Ivan Tam,

Hou In Derek Pun,

Austin T. Wang,

Angel X. Chang,

Manolis Savva; [pdf] [supp] [arXiv]
[bibtex]
@inproceedings{Tam_2026_WACV,
  author    = {Tam, Hou In Ivan and Pun, Hou In Derek and Wang, Austin T. and Chang, Angel X. and Savva, Manolis},
  title     = {SceneEval: Evaluating Semantic Coherence in Text-Conditioned 3D Indoor Scene Synthesis},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = {March},
  year      = {2026},
  pages     = {7355-7365}
}
Rethinking Latent Variable in Learned Image Compression: Fangzhou Yi,

Zhicheng Gong,

Hui Zeng; [pdf] [supp]
[bibtex]
@inproceedings{Yi_2026_WACV,
  author    = {Yi, Fangzhou and Gong, Zhicheng and Zeng, Hui},
  title     = {Rethinking Latent Variable in Learned Image Compression},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = {March},
  year      = {2026},
  pages     = {8531-8540}
}
MUSE: Model-based Uncertainty-aware Similarity Estimation for zero-shot 2D Object Detection and Segmentation: Sungmin Cho,

Sungbum Park,

Insoo Oh; [pdf] [supp] [arXiv]
[bibtex]
@inproceedings{Cho_2026_WACV,
  author    = {Cho, Sungmin and Park, Sungbum and Oh, Insoo},
  title     = {MUSE: Model-based Uncertainty-aware Similarity Estimation for zero-shot 2D Object Detection and Segmentation},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = {March},
  year      = {2026},
  pages     = {6090-6100}
}
Modeling and Learning Multiple Hypotheses for Monocular 3D Object Detection: Hyeonjeong Park,

Peixi Xiong,

Pei Yu,

Wei Tang; [pdf] [supp]
[bibtex]
@comment{Key disambiguated with a title keyword: Park_2026_WACV is already used by the ForestSplats entry earlier in this file, and BibTeX rejects a repeated key, so this entry was previously unreachable.}
@inproceedings{Park_2026_WACV_MultipleHypotheses,
  author    = {Park, Hyeonjeong and Xiong, Peixi and Yu, Pei and Tang, Wei},
  title     = {Modeling and Learning Multiple Hypotheses for Monocular 3D Object Detection},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = {March},
  year      = {2026},
  pages     = {7040-7050}
}
SD-CSFL: A Synthetic Data-Driven Conformity Scoring Framework for Robust Federated Learning: Ebtisaam Alharbi,

Abdulrahman Kerim,

Leandro Soriano Marcolino,

Qiang Ni; [pdf] [supp]
[bibtex]
@inproceedings{Alharbi_2026_WACV,
  author    = {Alharbi, Ebtisaam and Kerim, Abdulrahman and Marcolino, Leandro Soriano and Ni, Qiang},
  title     = {SD-CSFL: A Synthetic Data-Driven Conformity Scoring Framework for Robust Federated Learning},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = {March},
  year      = {2026},
  pages     = {6903-6912}
}
MedROV: Towards Real-Time Open-Vocabulary Detection Across Diverse Medical Imaging Modalities: Tooba Tehreem Sheikh,

Jean Lahoud,

Rao Muhammad Anwer,

Fahad Shahbaz Khan,

Salman Khan,

Hisham Cholakkal; [pdf] [supp] [arXiv]
[bibtex]
@inproceedings{Sheikh_2026_WACV,
  author    = {Sheikh, Tooba Tehreem and Lahoud, Jean and Anwer, Rao Muhammad and Khan, Fahad Shahbaz and Khan, Salman and Cholakkal, Hisham},
  title     = {MedROV: Towards Real-Time Open-Vocabulary Detection Across Diverse Medical Imaging Modalities},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = {March},
  year      = {2026},
  pages     = {8628-8638}
}
Towards Unconstrained Cross-View Pose Estimation: Alexander Wollam,

Kyle Ashley,

Maxim Shugaev,

Oliver Arend,

Ilya Semenov,

Hadis Dashtestani,

Sumved Ravi,

Nathan Jacobs; [pdf] [supp]
[bibtex]
@inproceedings{Wollam_2026_WACV,
  author    = {Wollam, Alexander and Ashley, Kyle and Shugaev, Maxim and Arend, Oliver and Semenov, Ilya and Dashtestani, Hadis and Ravi, Sumved and Jacobs, Nathan},
  title     = {Towards Unconstrained Cross-View Pose Estimation},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = {March},
  year      = {2026},
  pages     = {8448-8457}
}
FocalComm: Hard Instance-Aware Multi-Agent Perception: Dereje Shenkut,

Vijayakumar Bhagavatula; [pdf] [arXiv]
[bibtex]
@inproceedings{Shenkut_2026_WACV,
  author    = {Shenkut, Dereje and Bhagavatula, Vijayakumar},
  title     = {FocalComm: Hard Instance-Aware Multi-Agent Perception},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = {March},
  year      = {2026},
  pages     = {6277-6286}
}
Video and Language Alignment in 2D Systems for 3D Multi-object Scenes with Multi-Information Derivative-Free Control: Jason Armitage,

Rico Sennrich; [pdf] [supp]
[bibtex]
@inproceedings{Armitage_2026_WACV,
  author    = {Armitage, Jason and Sennrich, Rico},
  title     = {Video and Language Alignment in 2D Systems for 3D Multi-object Scenes with Multi-Information Derivative-Free Control},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = {March},
  year      = {2026},
  pages     = {6266-6276}
}
GaussianHeadTalk: Wobble-Free 3D Talking Heads with Audio Driven Gaussian Splatting: Madhav Agarwal,

Mingtian Zhang,

Laura Sevilla-Lara,

Steven McDonagh; [pdf] [supp]
[bibtex]
@inproceedings{Agarwal_2026_WACV,
  author    = {Agarwal, Madhav and Zhang, Mingtian and Sevilla-Lara, Laura and McDonagh, Steven},
  title     = {GaussianHeadTalk: Wobble-Free 3D Talking Heads with Audio Driven Gaussian Splatting},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = {March},
  year      = {2026},
  pages     = {8017-8027}
}
SVD-Det: A Lightweight Framework for Video Forgery Detection Using Semantic and Visual Defect Cues: Tsung-Shan Yang,

Tianyu Zhang,

Feng Qian,

Bing Yan,

C.-C. Jay Kuo; [pdf] [supp]
[bibtex]
@inproceedings{Yang_2026_WACV,
  author    = {Yang, Tsung-Shan and Zhang, Tianyu and Qian, Feng and Yan, Bing and Kuo, C.-C. Jay},
  title     = {SVD-Det: A Lightweight Framework for Video Forgery Detection Using Semantic and Visual Defect Cues},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = {March},
  year      = {2026},
  pages     = {7616-7625}
}
FastHMR: Accelerating Human Mesh Recovery via Token and Layer Merging with Diffusion Decoding: Soroush Mehraban,

Andrea Iaboni,

Babak Taati; [pdf] [supp] [arXiv]
[bibtex]
@inproceedings{Mehraban_2026_WACV,
  author    = {Mehraban, Soroush and Iaboni, Andrea and Taati, Babak},
  title     = {FastHMR: Accelerating Human Mesh Recovery via Token and Layer Merging with Diffusion Decoding},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = {March},
  year      = {2026},
  pages     = {6733-6743}
}
See, Think, Learn: A Self-Taught Multimodal Reasoner: Sourabh Sharma,

Sonam Gupta,

Sadbhawna Sadbhawna; [pdf] [supp] [arXiv]
[bibtex]
@inproceedings{Sharma_2026_WACV,
  author    = {Sharma, Sourabh and Gupta, Sonam and Sadbhawna, Sadbhawna},
  title     = {See, Think, Learn: A Self-Taught Multimodal Reasoner},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = {March},
  year      = {2026},
  pages     = {8313-8322}
}
CSF-Net: Context-Semantic Fusion Network for Large Mask Inpainting: Chae-Yeon Heo,

Yeong-Jun Cho; [pdf] [supp] [arXiv]
[bibtex]
@inproceedings{Heo_2026_WACV,
  author    = {Heo, Chae-Yeon and Cho, Yeong-Jun},
  title     = {CSF-Net: Context-Semantic Fusion Network for Large Mask Inpainting},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = {March},
  year      = {2026},
  pages     = {8292-8301}
}
Virtually Unrolling the Herculaneum Papyri by Diffeomorphic Spiral Fitting: Paul Henderson; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Henderson_2026_WACV,
  author    = {Henderson, Paul},
  title     = {Virtually Unrolling the {Herculaneum} Papyri by Diffeomorphic Spiral Fitting},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {6401--6411},
}
Exploring the Boundaries of Diffusion Models for Offline Writer Identification with Sparse and Intra-Variable Data: Aritra Dey,

Chandranath Adak,

Kumari Priya,

Soumi Chattopadhyay,

Sukalpa Chanda; [pdf] [supp]
[bibtex]
@InProceedings{Dey_2026_WACV,
  author    = {Dey, Aritra and Adak, Chandranath and Priya, Kumari and Chattopadhyay, Soumi and Chanda, Sukalpa},
  title     = {Exploring the Boundaries of Diffusion Models for Offline Writer Identification with Sparse and Intra-Variable Data},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {7178--7187},
}
Hierarchical Instance Tracking to Balance Privacy Preservation with Accessible Information: Neelima Prasad,

Jarek Reynolds,

Neel Karsanbhai,

Tanusree Sharma,

Lotus Zhang,

Abigale Stangl,

Yang Wang,

Leah Findlater,

Danna Gurari; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Prasad_2026_WACV,
  author    = {Prasad, Neelima and Reynolds, Jarek and Karsanbhai, Neel and Sharma, Tanusree and Zhang, Lotus and Stangl, Abigale and Wang, Yang and Findlater, Leah and Gurari, Danna},
  title     = {Hierarchical Instance Tracking to Balance Privacy Preservation with Accessible Information},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {5945--5955},
}
Photo Dating by Facial Age Aggregation: Jakub Paplhám,

Vojtěch Franc; [pdf] [supp]
[bibtex]
@InProceedings{Paplham_2026_WACV,
  author    = {Paplh{\'a}m, Jakub and Franc, Vojt{\v{e}}ch},
  title     = {Photo Dating by Facial Age Aggregation},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {8103--8112},
}
Test-Time Consistency in Vision Language Models: Shih-Han Chou,

Shivam Chandhok,

James J. Little,

Leonid Sigal; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Chou_2026_WACV,
  author    = {Chou, Shih-Han and Chandhok, Shivam and Little, James J. and Sigal, Leonid},
  title     = {Test-Time Consistency in Vision Language Models},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {7789--7798},
}
CSGaussian: Progressive Rate-Distortion Compression and Segmentation for 3D Gaussian Splatting: Yu-Jen Tseng,

Chia-Hao Kao,

Jing-Zhong Chen,

Alessandro Gnutti,

Shao-Yuan Lo,

Yen-Yu Lin,

Wen-Hsiao Peng; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Tseng_2026_WACV,
  author    = {Tseng, Yu-Jen and Kao, Chia-Hao and Chen, Jing-Zhong and Gnutti, Alessandro and Lo, Shao-Yuan and Lin, Yen-Yu and Peng, Wen-Hsiao},
  title     = {{CSGaussian}: Progressive Rate-Distortion Compression and Segmentation for {3D} {Gaussian} Splatting},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {6883--6892},
}
Conversational Image Generation: Towards Multi-Round Personalized Generation with Multi-Modal Language Models: Haochen Zhang,

Animesh Sinha,

Felix Juefei-Xu,

Haoyu Ma,

Kunpeng Li,

Zhipeng Fan,

Xiaoliang Dai,

Tingbo Hou,

Peizhao Zhang,

Zecheng He; [pdf] [supp]
[bibtex]
@InProceedings{Zhang_2026_WACV,
  author    = {Zhang, Haochen and Sinha, Animesh and Juefei-Xu, Felix and Ma, Haoyu and Li, Kunpeng and Fan, Zhipeng and Dai, Xiaoliang and Hou, Tingbo and Zhang, Peizhao and He, Zecheng},
  title     = {Conversational Image Generation: Towards Multi-Round Personalized Generation with Multi-Modal Language Models},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {8282--8291},
}
PhyEduVideo: A Benchmark for Evaluating Text-to-Video Models for Physics Education: Megha Mariam K.M,

Aditya Arun,

Zakaria Laskar,

C.V. Jawahar; [pdf] [supp]
[bibtex]
@InProceedings{K.M_2026_WACV,
  author    = {K.M, Megha Mariam and Arun, Aditya and Laskar, Zakaria and Jawahar, C. V.},
  title     = {{PhyEduVideo}: A Benchmark for Evaluating Text-to-Video Models for Physics Education},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {8690--8699},
}
PEaRL: Pathway-Enhanced Representation Learning for Gene and Pathway Expression Prediction from Histology: Sejuti Majumder,

Saarthak Kapse,

Moinak Bhattacharya,

Xuan Xu,

Alisa Yurovsky,

Prateek Prasanna; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Majumder_2026_WACV,
  author    = {Majumder, Sejuti and Kapse, Saarthak and Bhattacharya, Moinak and Xu, Xuan and Yurovsky, Alisa and Prasanna, Prateek},
  title     = {{PEaRL}: Pathway-Enhanced Representation Learning for Gene and Pathway Expression Prediction from Histology},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {8052--8062},
}
FastPose-ViT: A Vision Transformer for Real-Time Spacecraft Pose Estimation: Pierre Ancey,

Andrew Price,

Saqib Javed,

Mathieu Salzmann; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ancey_2026_WACV,
  author    = {Ancey, Pierre and Price, Andrew and Javed, Saqib and Salzmann, Mathieu},
  title     = {{FastPose-ViT}: A Vision Transformer for Real-Time Spacecraft Pose Estimation},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {7873--7882},
}
Improvise, Adapt, Overcome -- Telescopic Adapters for Efficient Fine-tuning of Vision Language Models in Medical Imaging: Ujjwal Mishra,

Vinita Shukla,

Praful Hambarde,

Amit Shukla; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Mishra_2026_WACV,
  author    = {Mishra, Ujjwal and Shukla, Vinita and Hambarde, Praful and Shukla, Amit},
  title     = {Improvise, Adapt, Overcome -- Telescopic Adapters for Efficient Fine-tuning of Vision Language Models in Medical Imaging},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {7605--7615},
}
Zero-LEAD: Source-Free Universal Domain Adaptation for Abdominal Multi-Organ Segmentation: Ahmed El-Sayed,

Marwan Torki; [pdf]
[bibtex]
@InProceedings{El-Sayed_2026_WACV,
  author    = {El-Sayed, Ahmed and Torki, Marwan},
  title     = {{Zero-LEAD}: Source-Free Universal Domain Adaptation for Abdominal Multi-Organ Segmentation},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {6715--6723},
}
Dual-Domain Multimodal Hyperbolic Fusion for Cardiopulmonary Disease Diagnosis in Emergency Care: Ke Nan,

Maggie Samaan,

Benjamin Burns,

Xia Ning,

Yuchi Han,

Yuan Xue; [pdf]
[bibtex]
@InProceedings{Nan_2026_WACV,
  author    = {Nan, Ke and Samaan, Maggie and Burns, Benjamin and Ning, Xia and Han, Yuchi and Xue, Yuan},
  title     = {Dual-Domain Multimodal Hyperbolic Fusion for Cardiopulmonary Disease Diagnosis in Emergency Care},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {8700--8710},
}
Procedure Learning via Regularized Gromov-Wasserstein Optimal Transport: Syed Ahmed Mahmood,

Ali Shah Ali,

Umer Ahmed,

Fawad Javed Fateh,

M. Zeeshan Zia,

Quoc-Huy Tran; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Mahmood_2026_WACV,
  author    = {Mahmood, Syed Ahmed and Ali, Ali Shah and Ahmed, Umer and Fateh, Fawad Javed and Zia, M. Zeeshan and Tran, Quoc-Huy},
  title     = {Procedure Learning via Regularized {Gromov-Wasserstein} Optimal Transport},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {6925--6935},
}
PDV: Prompt Directional Vectors for Zero-shot Composed Image Retrieval: Osman Tursun,

Sinan Kalkan,

Simon Denman,

Clinton Fookes; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Tursun_2026_WACV,
  author    = {Tursun, Osman and Kalkan, Sinan and Denman, Simon and Fookes, Clinton},
  title     = {{PDV}: Prompt Directional Vectors for Zero-shot Composed Image Retrieval},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {7740--7749},
}
Any Detector Can Detect Anything: Thomas E. Huang,

Siyuan Li,

Martin Danelljan,

Henghui Ding,

Luc Van Gool,

Fisher Yu; [pdf] [supp]
[bibtex]
@InProceedings{Huang_2026_WACV,
  author    = {Huang, Thomas E. and Li, Siyuan and Danelljan, Martin and Ding, Henghui and Van Gool, Luc and Yu, Fisher},
  title     = {Any Detector Can Detect Anything},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {8437--8447},
}
Automated Suturing Skill Assessment in Robot-assisted Surgery from Endoscopic Videos using Clinically-guided Evaluation Criteria: Atharva Sunil Deo,

Ujjwal Pasupulety,

Nicholas Matsumoto,

Jay Moran,

Cherine Yang,

Jeanine Kim,

Rafal Dariusz Kocielnik,

Aurash Naser-Tavakolian,

Andrew Hung; [pdf]
[bibtex]
@InProceedings{Deo_2026_WACV,
  author    = {Deo, Atharva Sunil and Pasupulety, Ujjwal and Matsumoto, Nicholas and Moran, Jay and Yang, Cherine and Kim, Jeanine and Kocielnik, Rafal Dariusz and Naser-Tavakolian, Aurash and Hung, Andrew},
  title     = {Automated Suturing Skill Assessment in Robot-assisted Surgery from Endoscopic Videos using Clinically-guided Evaluation Criteria},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {7218--7228},
}
Polymorph: Energy-Efficient Multi-Label Classification for Video Streams on Embedded Devices: Saeid Ghafouri,

Mohsen Fayyaz,

Xiangchen Li,

Deepu John,

Bo Ji,

Dimitrios S. Nikolopoulos,

Hans Vandierendonck; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ghafouri_2026_WACV,
  author    = {Ghafouri, Saeid and Fayyaz, Mohsen and Li, Xiangchen and John, Deepu and Ji, Bo and Nikolopoulos, Dimitrios S. and Vandierendonck, Hans},
  title     = {Polymorph: Energy-Efficient Multi-Label Classification for Video Streams on Embedded Devices},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {6432--6441},
}
VectorSynth: Fine-Grained Satellite Image Synthesis with Structured Semantics: Daniel Cher,

Brian Wei,

Srikumar Sastry,

Nathan Jacobs; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Cher_2026_WACV,
  author    = {Cher, Daniel and Wei, Brian and Sastry, Srikumar and Jacobs, Nathan},
  title     = {{VectorSynth}: Fine-Grained Satellite Image Synthesis with Structured Semantics},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {7019--7029},
}
DiffRegCD: Integrated Registration and Change Detection with Diffusion Features: Seyedehanita Madani,

Rama Chellappa,

Vishal M. Patel; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Madani_2026_WACV,
  author    = {Madani, Seyedehanita and Chellappa, Rama and Patel, Vishal M.},
  title     = {{DiffRegCD}: Integrated Registration and Change Detection with Diffusion Features},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {7503--7512},
}
LangPose: Language-Aligned Motion for Robust 3D Human Pose Estimation: Longyun Liao,

Rong Zheng; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Liao_2026_WACV,
  author    = {Liao, Longyun and Zheng, Rong},
  title     = {{LangPose}: Language-Aligned Motion for Robust {3D} Human Pose Estimation},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {8073--8083},
}
CLIP-UP: CLIP-Based Unanswerable Problem Detection for Visual Question Answering: Ben Vardi,

Oron Nir,

Ariel Shamir; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Vardi_2026_WACV,
  author    = {Vardi, Ben and Nir, Oron and Shamir, Ariel},
  title     = {{CLIP-UP}: {CLIP}-Based Unanswerable Problem Detection for Visual Question Answering},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {5898--5908},
}
Beyond Paired Data: Self-Supervised UAV Geo-Localization from Reference Imagery Alone: Tristan Amadei,

Enric Meinhardt-Llopis,

Benedicte Bascle,

Corentin Abgrall,

Gabriele Facciolo; [pdf] [supp]
[bibtex]
@InProceedings{Amadei_2026_WACV,
  author    = {Amadei, Tristan and Meinhardt-Llopis, Enric and Bascle, Benedicte and Abgrall, Corentin and Facciolo, Gabriele},
  title     = {Beyond Paired Data: Self-Supervised {UAV} Geo-Localization from Reference Imagery Alone},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {7409--7419},
}
Training-Free Few-Shot Segmentation via Vision-Language Guided Prompting: Euihyun Yoon,

Taejin Park,

Jaekoo Lee; [pdf]
[bibtex]
@InProceedings{Yoon_2026_WACV,
  author    = {Yoon, Euihyun and Park, Taejin and Lee, Jaekoo},
  title     = {Training-Free Few-Shot Segmentation via Vision-Language Guided Prompting},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {6517--6526},
}
HDR Reconstruction Boosting with Training-Free and Exposure-Consistent Diffusion: Yo-Tin Lin,

Su-Kai Chen,

Hou-Ning Hu,

Yen-Yu Lin,

Yu-Lun Liu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Lin_2026_WACV,
  author    = {Lin, Yo-Tin and Chen, Su-Kai and Hu, Hou-Ning and Lin, Yen-Yu and Liu, Yu-Lun},
  title     = {{HDR} Reconstruction Boosting with Training-Free and Exposure-Consistent Diffusion},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {7513--7523},
}
Exploring Automated Recognition of Instructional Activity and Discourse from Multimodal Classroom Data: Ivo Bueno,

Ruikun Hou,

Babette Bühler,

Tim Fütterer,

James Drimalla,

Jonathan K. Foster,

Peter Youngs,

Peter Gerjets,

Ulrich Trautwein,

Enkelejda Kasneci; [pdf] [supp]
[bibtex]
@InProceedings{Bueno_2026_WACV,
  author    = {Bueno, Ivo and Hou, Ruikun and B{\"u}hler, Babette and F{\"u}tterer, Tim and Drimalla, James and Foster, Jonathan K. and Youngs, Peter and Gerjets, Peter and Trautwein, Ulrich and Kasneci, Enkelejda},
  title     = {Exploring Automated Recognition of Instructional Activity and Discourse from Multimodal Classroom Data},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {6806--6817},
}
SCAdapter: Content-Style Disentanglement for Diffusion Style Transfer: Luan Thanh Trinh; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Trinh_2026_WACV,
  author    = {Trinh, Luan Thanh},
  title     = {{SCAdapter}: Content-Style Disentanglement for Diffusion Style Transfer},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {7312--7321},
}
Equivariant Sampling for Improving Diffusion Model-based Image Restoration: Chenxu Wu,

Qingpeng Kong,

Peiang Zhao,

Wendi Yang,

Wenxin Ma,

Fenghe Tang,

Zihang Jiang,

S. Kevin Zhou; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wu_2026_WACV,
  author    = {Wu, Chenxu and Kong, Qingpeng and Zhao, Peiang and Yang, Wendi and Ma, Wenxin and Tang, Fenghe and Jiang, Zihang and Zhou, S. Kevin},
  title     = {Equivariant Sampling for Improving Diffusion Model-based Image Restoration},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {6827--6839},
}
AuViRe: Audio-visual Speech Representation Reconstruction for Deepfake Temporal Localization: Christos Koutlis,

Symeon Papadopoulos; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Koutlis_2026_WACV,
  author    = {Koutlis, Christos and Papadopoulos, Symeon},
  title     = {{AuViRe}: Audio-visual Speech Representation Reconstruction for Deepfake Temporal Localization},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {7168--7177},
}
Predicting Task fMRI Contrasts from Resting-State fMRI Using Sparse 3D Convolutions: Ivan Sviridov,

Maria Boyko,

Maksim Sharaev; [pdf]
[bibtex]
@InProceedings{Sviridov_2026_WACV,
  author    = {Sviridov, Ivan and Boyko, Maria and Sharaev, Maksim},
  title     = {Predicting Task {fMRI} Contrasts from Resting-State {fMRI} Using Sparse {3D} Convolutions},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {6320--6329},
}
Causality-Driven Audits of Model Robustness: Nathan Drenkow,

William Paul,

Chris Ribaudo,

Mathias Unberath; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Drenkow_2026_WACV,
  author    = {Drenkow, Nathan and Paul, William and Ribaudo, Chris and Unberath, Mathias},
  title     = {Causality-Driven Audits of Model Robustness},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {5956--5966},
}
Pointmap-Conditioned Diffusion for Consistent Novel View Synthesis: Thang-Anh-Quan Nguyen,

Laurent Caraffa,

Jean-Philippe Tarel,

Roland Brémond; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Nguyen_2026_WACV,
  author    = {Nguyen, Thang-Anh-Quan and Caraffa, Laurent and Tarel, Jean-Philippe and Br{\'e}mond, Roland},
  title     = {Pointmap-Conditioned Diffusion for Consistent Novel View Synthesis},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {6360--6370},
}
Reciprocal Teaching: Dynamic Multi-Model Teacher-Student Learning for Multiple Noisy Annotations: Wenjie Ai,

Cuong C. Nguyen,

Adrian Hilton,

Gustavo Carneiro; [pdf] [supp]
[bibtex]
@InProceedings{Ai_2026_WACV,
  author    = {Ai, Wenjie and Nguyen, Cuong C. and Hilton, Adrian and Carneiro, Gustavo},
  title     = {Reciprocal Teaching: Dynamic Multi-Model Teacher-Student Learning for Multiple Noisy Annotations},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {8376--8385},
}
RampWatch: An In-the-Wild Dataset and Text-Guided Detection Framework for Recreational Vessels: Malik Muhammad Asim,

Claire B. Smallwood,

Abdullah Tariq,

Johnny Lo,

Syed Zulqarnain Gilani; [pdf] [supp]
[bibtex]
@InProceedings{Asim_2026_WACV,
  author    = {Asim, Malik Muhammad and Smallwood, Claire B. and Tariq, Abdullah and Lo, Johnny and Gilani, Syed Zulqarnain},
  title     = {{RampWatch}: An In-the-Wild Dataset and Text-Guided Detection Framework for Recreational Vessels},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {7576--7585},
}
Q-Former Autoencoder: A Modern Framework for Medical Anomaly Detection: Francesco Dalmonte,

Emirhan Bayar,

Emre Akbas,

Mariana-Iuliana Georgescu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Dalmonte_2026_WACV,
  author    = {Dalmonte, Francesco and Bayar, Emirhan and Akbas, Emre and Georgescu, Mariana-Iuliana},
  title     = {{Q-Former} Autoencoder: A Modern Framework for Medical Anomaly Detection},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {7985--7995},
}
MoSCo: Real-time and Efficient Text-to-Motion Synthesis via Delta Training: Zhiyuan Zhang,

Lingqiao Liu; [pdf]
[bibtex]
@InProceedings{Zhang_2026_WACV,
  author    = {Zhang, Zhiyuan and Liu, Lingqiao},
  title     = {{MoSCo}: Real-time and Efficient Text-to-Motion Synthesis via Delta Training},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {6298--6308},
}
Splannequin: Freezing Monocular Mannequin-Challenge Footage with Dual-Detection Splatting: Hao-Jen Chien,

Yi-Chuan Huang,

Chung-Ho Wu,

Wei-Lun Chao,

Yu-Lun Liu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Chien_2026_WACV,
  author    = {Chien, Hao-Jen and Huang, Yi-Chuan and Wu, Chung-Ho and Chao, Wei-Lun and Liu, Yu-Lun},
  title     = {Splannequin: Freezing Monocular Mannequin-Challenge Footage with Dual-Detection Splatting},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {8028--8040},
}
Hybrid State Representation for Video Procedure Planning: Woo Suk Choi,

Youwon Jang,

Minsu Lee,

Byoung-Tak Zhang; [pdf] [supp]
[bibtex]
@InProceedings{Choi_2026_WACV,
  author    = {Choi, Woo Suk and Jang, Youwon and Lee, Minsu and Zhang, Byoung-Tak},
  title     = {Hybrid State Representation for Video Procedure Planning},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {6507--6516},
}
Diagnose Like A REAL Pathologist: An Uncertainty-Focused Approach for Trustworthy Multi-Resolution Multiple Instance Learning: Sungrae Hong,

Sol Lee,

Jisu Shin,

Jiwon Jeong,

Mun Yong Yi; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Hong_2026_WACV,
  author    = {Hong, Sungrae and Lee, Sol and Shin, Jisu and Jeong, Jiwon and Yi, Mun Yong},
  title     = {Diagnose Like A {REAL} Pathologist: An Uncertainty-Focused Approach for Trustworthy Multi-Resolution Multiple Instance Learning},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {6132--6141},
}
Align Video Diffusion Model with Online Video-Centric Preference Optimization: Jiacheng Zhang,

Jie Wu,

Weifeng Chen,

Yatai Ji,

Xuefeng Xiao,

Weilin Huang,

Kai Han; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhang_2026_WACV,
  author    = {Zhang, Jiacheng and Wu, Jie and Chen, Weifeng and Ji, Yatai and Xiao, Xuefeng and Huang, Weilin and Han, Kai},
  title     = {Align Video Diffusion Model with Online Video-Centric Preference Optimization},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {6142--6152},
}
AortaDiff: A Unified Multitask Diffusion Framework for Contrast-Free AAA Imaging: Yuxuan Ou,

Ning Bi,

Jiazhen Pan,

Jiancheng Yang,

Boliang Yu,

Usama Zidan,

Regent Lee,

Vicente Grau; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ou_2026_WACV,
  author    = {Ou, Yuxuan and Bi, Ning and Pan, Jiazhen and Yang, Jiancheng and Yu, Boliang and Zidan, Usama and Lee, Regent and Grau, Vicente},
  title     = {{AortaDiff}: A Unified Multitask Diffusion Framework for Contrast-Free {AAA} Imaging},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {8242--8251},
}
High-Level Semantics and Low-Level Features Fusion for Multi-Scale Object Detection in Dynamic Construction Environments: Mahdi Bonyani,

Maryam Soleymani,

Chao Wang; [pdf]
[bibtex]
@InProceedings{Bonyani_2026_WACV,
  author    = {Bonyani, Mahdi and Soleymani, Maryam and Wang, Chao},
  title     = {High-Level Semantics and Low-Level Features Fusion for Multi-Scale Object Detection in Dynamic Construction Environments},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {6527--6536},
}
AusSmoke meets MultiNatSmoke: a fully-labelled diverse smoke segmentation dataset: Weihao Li,

Hongjin Zhao,

Gao Zhu,

Ge-Peng Ji,

Nicholas Wilson,

Marta Yebra,

Nick Barnes; [pdf]
[bibtex]
@InProceedings{Li_2026_WACV,
  author    = {Li, Weihao and Zhao, Hongjin and Zhu, Gao and Ji, Ge-Peng and Wilson, Nicholas and Yebra, Marta and Barnes, Nick},
  title     = {{AusSmoke} meets {MultiNatSmoke}: a fully-labelled diverse smoke segmentation dataset},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {7996--8006},
}
MVAT: Multi-View Aware Teacher for Weakly Supervised 3D Object Detection: Saad Lahlali,

Alexandre Fournier-Mongieux,

Nicolas Granger,

Hervé Le Borgne,

Quoc-Cuong Pham; [pdf] [supp]
[bibtex]
@InProceedings{Lahlali_2026_WACV,
  author    = {Lahlali, Saad and Fournier-Mongieux, Alexandre and Granger, Nicolas and Le Borgne, Herv{\'e} and Pham, Quoc-Cuong},
  title     = {{MVAT}: Multi-View Aware Teacher for Weakly Supervised {3D} Object Detection},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {6101--6110},
}
DreamCatcher: Efficient Multi-Concept Customization via Representation Finetuning: Jungwon Lee,

Changhun Lee,

Eunhyeok Park; [pdf] [supp]
[bibtex]
@InProceedings{Lee_2026_WACV,
  author    = {Lee, Jungwon and Lee, Changhun and Park, Eunhyeok},
  title     = {{DreamCatcher}: Efficient Multi-Concept Customization via Representation Finetuning},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {7062--7072},
}
GorillaWatch: An Automated System for In-the-Wild Gorilla Re-Identification and Population Monitoring: Maximilian Schall,

Felix Leonard Knöfel,

Noah Elias König,

Jan Jonas Kubeler,

Maximilian von Klinski,

Joan Wilhelm Linnemann,

Xiaoshi Liu,

Iven Jelle Schlegelmilch,

Ole Woyciniuk,

Alexandra Schild,

Dante Wasmuht,

Magdalena Bermejo Espinet,

German Illera Basas,

Gerard de Melo; [pdf]
[bibtex]
@InProceedings{Schall_2026_WACV,
  author    = {Schall, Maximilian and Kn{\"o}fel, Felix Leonard and K{\"o}nig, Noah Elias and Kubeler, Jan Jonas and von Klinski, Maximilian and Linnemann, Joan Wilhelm and Liu, Xiaoshi and Schlegelmilch, Iven Jelle and Woyciniuk, Ole and Schild, Alexandra and Wasmuht, Dante and Bermejo Espinet, Magdalena and Illera Basas, German and de Melo, Gerard},
  title     = {{GorillaWatch}: An Automated System for In-the-Wild Gorilla Re-Identification and Population Monitoring},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {8364--8375},
}
CLoCKDistill: Consistent Location and Context aware Knowledge Distillation for DETRs: Qizhen Lan,

Qing Tian; [pdf] [arXiv]
[bibtex]
@InProceedings{Lan_2026_WACV,
  author    = {Lan, Qizhen and Tian, Qing},
  title     = {{CLoCKDistill}: Consistent Location and Context aware Knowledge Distillation for {DETRs}},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {7188--7197},
}
NAPP: Noise-Adaptive Prototype Perturbation for Few-Shot Learning: Ilhwan Kim,

Sangwoo Yun,

Dongheon Lee,

Seongsu Kim,

Joonki Paik; [pdf]
[bibtex]
@InProceedings{Kim_2026_WACV,
  author    = {Kim, Ilhwan and Yun, Sangwoo and Lee, Dongheon and Kim, Seongsu and Paik, Joonki},
  title     = {{NAPP}: Noise-Adaptive Prototype Perturbation for Few-Shot Learning},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {8007--8016},
}
MemeTAG: Keyword-Driven Meme Classification through Tag Embedding Reconstruction: Akshit Sharma,

Prashant W Patil; [pdf] [supp]
[bibtex]
@InProceedings{Sharma_2026_WACV,
  author    = {Sharma, Akshit and Patil, Prashant W},
  title     = {{MemeTAG}: Keyword-Driven Meme Classification through Tag Embedding Reconstruction},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {7679--7688},
}
Hymavi : A Hybrid Mamba-Attention Network in Multi-View Framework for Volumetric Medical Image Segmentation: Sy Dat Tran,

Jin Kyu Gahm; [pdf]
[bibtex]
@InProceedings{Tran_2026_WACV,
  author    = {Tran, Sy Dat and Gahm, Jin Kyu},
  title     = {Hymavi : A Hybrid {Mamba}-Attention Network in Multi-View Framework for Volumetric Medical Image Segmentation},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {6006--6015},
}
DocWaveDiff: A Predict-and-Refine approach for Document Image Enhancement with Wavelet U-Nets and Diffusion models: Matteo Marulli,

Marco Bertini; [pdf] [supp]
[bibtex]
@InProceedings{Marulli_2026_WACV,
  author    = {Marulli, Matteo and Bertini, Marco},
  title     = {{DocWaveDiff}: A Predict-and-Refine approach for Document Image Enhancement with Wavelet {U-Nets} and Diffusion models},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {8511--8520},
}
ODEt(ODEl): Shortcutting the Time and the Length in Diffusion and Flow Models for Faster Sampling: Denis Gudovskiy,

Wenzhao Zheng,

Tomoyuki Okuno,

Yohei Nakata,

Kurt Keutzer; [pdf] [supp]
[bibtex]
@InProceedings{Gudovskiy_2026_WACV,
  author    = {Gudovskiy, Denis and Zheng, Wenzhao and Okuno, Tomoyuki and Nakata, Yohei and Keutzer, Kurt},
  title     = {{ODEt(ODEl)}: Shortcutting the Time and the Length in Diffusion and Flow Models for Faster Sampling},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {6111--6120},
}
Can Image Splicing and Copy-Move Forgery Be Detected by the Same Model? Forensim: An Attention-Based State-Space Approach: Soumyaroop Nandi,

Prem Natarajan; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Nandi_2026_WACV,
  author    = {Nandi, Soumyaroop and Natarajan, Prem},
  title     = {Can Image Splicing and Copy-Move Forgery Be Detected by the Same Model? {Forensim}: An Attention-Based State-Space Approach},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {6194--6204},
}
TopoRec: Point Cloud Recognition Using Topological Data Analysis: Anirban Ghosh,

Iliya Kulbaka,

Ian Dahlin,

Ayan Dutta; [pdf] [arXiv]
[bibtex]
@InProceedings{Ghosh_2026_WACV,
  author    = {Ghosh, Anirban and Kulbaka, Iliya and Dahlin, Ian and Dutta, Ayan},
  title     = {{TopoRec}: Point Cloud Recognition Using Topological Data Analysis},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {7544--7553},
}
SFMNet: Sparse Focal Modulation for 3D Object Detection: Oren Shrout,

Ayellet Tal; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Shrout_2026_WACV,
  author    = {Shrout, Oren and Tal, Ayellet},
  title     = {{SFMNet}: Sparse Focal Modulation for {3D} Object Detection},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {6287--6297},
}
Multi-Grained Text-Guided Image Fusion for Multi-Exposure and Multi-Focus Scenarios: Mingwei Tang,

Jiahao Nie,

Guang Yang,

Ziqing Cui,

Jie Li; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Tang_2026_WACV,
  author    = {Tang, Mingwei and Nie, Jiahao and Yang, Guang and Cui, Ziqing and Li, Jie},
  title     = {Multi-Grained Text-Guided Image Fusion for Multi-Exposure and Multi-Focus Scenarios},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  month     = mar,
  year      = {2026},
  pages     = {7668--7678},
}
F-INR: Functional Tensor Decomposition for Implicit Neural Representations: Sai Karthikeya Vemuri,

Tim Büchner,

Joachim Denzler; [pdf] [supp]
[bibtex]
@InProceedings{Vemuri_2026_WACV,
  author    = {Vemuri, Sai Karthikeya and B{\"u}chner, Tim and Denzler, Joachim},
  title     = {{F-INR}: Functional Tensor Decomposition for Implicit Neural Representations},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {6557--6568},
}
Understanding the Visual Projection Space of Multimodal LLMs: Sungheon Jeong,

Yoojeong Song,

Hyungjoon Kim; [pdf]
[bibtex]
@InProceedings{Jeong_2026_WACV,
  author    = {Jeong, Sungheon and Song, Yoojeong and Kim, Hyungjoon},
  title     = {Understanding the Visual Projection Space of Multimodal {LLMs}},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {6049--6058},
}
Flood-LDM: Generalizable Latent Diffusion Models for rapid and accurate zero-shot High-Resolution Flood Mapping: Sun Han Neo,

Sachith Seneviratne,

Herath Mudiyanselage Viraj Vidura Herath,

Abhishek Saha,

Sanka Rasnayaka,

Lucy Amanda Marshall; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Neo_2026_WACV,
  author    = {Neo, Sun Han and Seneviratne, Sachith and Herath, Herath Mudiyanselage Viraj Vidura and Saha, Abhishek and Rasnayaka, Sanka and Marshall, Lucy Amanda},
  title     = {{Flood-LDM}: Generalizable Latent Diffusion Models for rapid and accurate zero-shot High-Resolution Flood Mapping},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {8063--8072},
}
PerVL-Bench: Benchmarking Multimodal Personalization for Large Vision-Language Models: Minsung Kim; [pdf] [supp]
[bibtex]
@InProceedings{Kim_2026_WACV,
  author    = {Kim, Minsung},
  title     = {{PerVL-Bench}: Benchmarking Multimodal Personalization for Large Vision-Language Models},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {6696--6704},
}
OSEG: Improving Diffusion sampling through Orthogonal Smoothed Energy Guidance: Masud An Nur Islam Fahim,

Nazmus Saqib,

Joon-Min Gil; [pdf] [supp]
[bibtex]
@InProceedings{Fahim_2026_WACV,
  author    = {Fahim, Masud An Nur Islam and Saqib, Nazmus and Gil, Joon-Min},
  title     = {{OSEG}: Improving Diffusion sampling through Orthogonal Smoothed Energy Guidance},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {5996--6005},
}
Motion-Aware Graph Fusion Network for 3D Human Pose Estimation: Yen Pham,

Xiaohui Yuan,

Chengyuan Zhuang; [pdf] [supp]
[bibtex]
@InProceedings{Pham_2026_WACV,
  author    = {Pham, Yen and Yuan, Xiaohui and Zhuang, Chengyuan},
  title     = {Motion-Aware Graph Fusion Network for {3D} Human Pose Estimation},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {5798--5808},
}
Graph Query Networks for Object Detection with Automotive Radar: Loveneet Saini,

Hasan Tercan,

Tobias Meisen; [pdf] [arXiv]
[bibtex]
@InProceedings{Saini_2026_WACV,
  author    = {Saini, Loveneet and Tercan, Hasan and Meisen, Tobias},
  title     = {Graph Query Networks for Object Detection with Automotive Radar},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {6988--6997},
}
GroupPortrait: Multi-ID Portrait Generation with High Identity Preservation and Fine-Grained Control: Meijia Huang,

Ruida Li,

Bing Ma,

Liangwei Jiang,

Shuo Fang,

Chenguang Ma; [pdf] [supp]
[bibtex]
@InProceedings{Huang_2026_WACV,
  author    = {Huang, Meijia and Li, Ruida and Ma, Bing and Jiang, Liangwei and Fang, Shuo and Ma, Chenguang},
  title     = {{GroupPortrait}: {Multi-ID} Portrait Generation with High Identity Preservation and Fine-Grained Control},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {6226--6235},
}
FAIR-SIGHT: Fairness Assurance in Image Recognition via Simultaneous Conformal Thresholding and Dynamic Output Repair: Arya Fayyazi,

Mehdi Kamal,

Massoud Pedram; [pdf] [arXiv]
[bibtex]
@InProceedings{Fayyazi_2026_WACV,
  author    = {Fayyazi, Arya and Kamal, Mehdi and Pedram, Massoud},
  title     = {{FAIR-SIGHT}: Fairness Assurance in Image Recognition via Simultaneous Conformal Thresholding and Dynamic Output Repair},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {6633--6642},
}
T2LF: LLM-Guided Multimodal Diffusion for Text-to-Light Field Synthesis: Soyoung Yoon,

Namhyuk Ahn,

In Kyu Park; [pdf] [supp]
[bibtex]
@InProceedings{Yoon_2026_WACV,
  author    = {Yoon, Soyoung and Ahn, Namhyuk and Park, In Kyu},
  title     = {{T2LF}: {LLM-Guided} Multimodal Diffusion for Text-to-Light Field Synthesis},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {7322--7332},
}
Training-free Conditional Image Embedding Framework Leveraging Large Vision Language Models: Masayuki Kawarada,

Kosuke Yamada,

Antonio Tejero-de-Pablos,

Naoto Inoue; [pdf] [supp]
[bibtex]
@InProceedings{Kawarada_2026_WACV,
  author    = {Kawarada, Masayuki and Yamada, Kosuke and Tejero-de-Pablos, Antonio and Inoue, Naoto},
  title     = {Training-free Conditional Image Embedding Framework Leveraging Large Vision Language Models},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {7636--7646},
}
General and Domain-Specific Zero-shot Detection of Generated Images via Conditional Likelihood: Roy Betser,

Omer Hofman,

Roman Vainshtein,

Guy Gilboa; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Betser_2026_WACV,
  author    = {Betser, Roy and Hofman, Omer and Vainshtein, Roman and Gilboa, Guy},
  title     = {General and Domain-Specific Zero-shot Detection of Generated Images via Conditional Likelihood},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {7809--7820},
}
MM-TS: Multi-Modal Temperature and Margin Schedules for Contrastive Learning with Long-Tail Data: Siarhei Sheludzko,

Dhimitrios Duka,

Bernt Schiele,

Hilde Kuehne,

Anna Kukleva; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Sheludzko_2026_WACV,
  author    = {Sheludzko, Siarhei and Duka, Dhimitrios and Schiele, Bernt and Kuehne, Hilde and Kukleva, Anna},
  title     = {{MM-TS}: Multi-Modal Temperature and Margin Schedules for Contrastive Learning with Long-Tail Data},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {7376--7386},
}
VitaGlyph: Vitalizing Artistic Typography with Flexible Dual-branch Diffusion Models: Kailai Feng,

Yabo Zhang,

Haodong Yu,

Zhilong Ji,

Jinfeng Bai,

Hongzhi Zhang,

Wangmeng Zuo; [pdf] [arXiv]
[bibtex]
@InProceedings{Feng_2026_WACV,
  author    = {Feng, Kailai and Zhang, Yabo and Yu, Haodong and Ji, Zhilong and Bai, Jinfeng and Zhang, Hongzhi and Zuo, Wangmeng},
  title     = {{VitaGlyph}: Vitalizing Artistic Typography with Flexible Dual-branch Diffusion Models},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {8220--8230},
}
GHOST: Getting to the Bottom of Hallucinations with A Multi-round Consistency Benchmark: Vibashan VS,

Nadine Chang,

Jenny Schmalfuss,

Vishal M. Patel,

Zhiding Yu,

Jose M. Alvarez; [pdf] [supp]
[bibtex]
@InProceedings{VS_2026_WACV,
  author    = {VS, Vibashan and Chang, Nadine and Schmalfuss, Jenny and Patel, Vishal M. and Yu, Zhiding and Alvarez, Jose M.},
  title     = {{GHOST}: Getting to the Bottom of Hallucinations with A Multi-round Consistency Benchmark},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {6163--6173},
}
Optimizing against Infeasible Inclusions from Data for Semantic Segmentation through Morphology: Shamik Basu,

Luc Van Gool,

Christos Sakaridis; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Basu_2026_WACV,
  author    = {Basu, Shamik and Van Gool, Luc and Sakaridis, Christos},
  title     = {Optimizing against Infeasible Inclusions from Data for Semantic Segmentation through Morphology},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {7524--7533},
}
Zero-Shot Audio-Visual Editing via Cross-Modal Delta Denoising: Yan-Bo Lin,

Kevin Lin,

Zhengyuan Yang,

Linjie Li,

Jianfeng Wang,

Chung-Ching Lin,

Xiaofei Wang,

Gedas Bertasius,

Lijuan Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Lin_2026_WACV,
  author    = {Lin, Yan-Bo and Lin, Kevin and Yang, Zhengyuan and Li, Linjie and Wang, Jianfeng and Lin, Chung-Ching and Wang, Xiaofei and Bertasius, Gedas and Wang, Lijuan},
  title     = {Zero-Shot Audio-Visual Editing via Cross-Modal Delta Denoising},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {7344--7354},
}
D2Mamba: Dual Domain Guided Informed Search in State Space Model for Underwater Image Enhancement: Alik Pramanick,

Soumajit Roy,

Arijit Sur; [pdf] [supp]
[bibtex]
@InProceedings{Pramanick_2026_WACV,
  author    = {Pramanick, Alik and Roy, Soumajit and Sur, Arijit},
  title     = {{D2Mamba}: Dual Domain Guided Informed Search in State Space Model for Underwater Image Enhancement},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {7126--7136},
}
TM-Adapter: Temporal Merge Adapter for Efficient Global Temporal Modeling: Woo Joo Hahm,

Seungwoo Jang,

Hyeon Tak Kim,

Daeun Lee,

Kwangsu Kim; [pdf] [supp]
[bibtex]
@InProceedings{Hahm_2026_WACV,
  author    = {Hahm, Woo Joo and Jang, Seungwoo and Kim, Hyeon Tak and Lee, Daeun and Kim, Kwangsu},
  title     = {{TM-Adapter}: Temporal Merge Adapter for Efficient Global Temporal Modeling},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {6121--6131},
}
Guiding What Not to Generate: Automated Negative Prompting for Text-Image Alignment: Sangha Park,

Eunji Kim,

Yeongtak Oh,

Jooyoung Choi,

Sungroh Yoon; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Park_2026_WACV,
  author    = {Park, Sangha and Kim, Eunji and Oh, Yeongtak and Choi, Jooyoung and Yoon, Sungroh},
  title     = {Guiding What Not to Generate: Automated Negative Prompting for Text-Image Alignment},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {6664--6675},
}
LASER: Lip Landmark Assisted Speaker Detection for Robustness: Le Thien Phuc Nguyen,

Zhuoran Yu,

Yong Jae Lee; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Nguyen_2026_WACV,
  author    = {Nguyen, Le Thien Phuc and Yu, Zhuoran and Lee, Yong Jae},
  title     = {{LASER}: Lip Landmark Assisted Speaker Detection for Robustness},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {7291--7300},
}
SpecGen: Neural Spectral BRDF Generation via Spectral-Spatial Tri-plane Aggregation: Zhenyu Jin,

Wenjie Li,

Zhanyu Ma,

Heng Guo; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Jin_2026_WACV,
  author    = {Jin, Zhenyu and Li, Wenjie and Ma, Zhanyu and Guo, Heng},
  title     = {{SpecGen}: Neural Spectral {BRDF} Generation via Spectral-Spatial Tri-plane Aggregation},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {8323--8332},
}
A Unified Diffusion-Based Framework for Multi-Agent Trajectory Prediction Integrating Structured Multi-Modal Representations: Chenxi Yang,

Suyang Xi,

Hong Ding,

Yiqing Shen,

Yunhao Liu; [pdf]
[bibtex]
@InProceedings{Yang_2026_WACV,
  author    = {Yang, Chenxi and Xi, Suyang and Ding, Hong and Shen, Yiqing and Liu, Yunhao},
  title     = {A Unified Diffusion-Based Framework for Multi-Agent Trajectory Prediction Integrating Structured Multi-Modal Representations},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {6442--6452},
}
IMPACT: Interpretable Most Important Person Analysis and Classification using Transformer-based Models: Akshat Rampuria,

Kamakshya Prasad Nayak,

Kamalakar Vijay Thakare,

Tushar Joshi,

Aditya Dhananjay Singh,

Haesol Park,

Heeseung Choi,

Debi Prosad Dogra,

Ig-Jae Kim; [pdf] [supp]
[bibtex]
@InProceedings{Rampuria_2026_WACV,
  author    = {Rampuria, Akshat and Nayak, Kamakshya Prasad and Thakare, Kamalakar Vijay and Joshi, Tushar and Singh, Aditya Dhananjay and Park, Haesol and Choi, Heeseung and Dogra, Debi Prosad and Kim, Ig-Jae},
  title     = {{IMPACT}: Interpretable Most Important Person Analysis and Classification using Transformer-based Models},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {8179--8187},
}
HOLO: Holistic Lightweight Optimization for Scene Understanding with Auto-Annotation and Multimodal Learning: Xiaoyun Hu,

Xiaohan Yan,

Nan Wang,

Gang Wei,

Zhicheng Wang; [pdf] [supp]
[bibtex]
@InProceedings{Hu_2026_WACV,
  author    = {Hu, Xiaoyun and Yan, Xiaohan and Wang, Nan and Wei, Gang and Wang, Zhicheng},
  title     = {{HOLO}: Holistic Lightweight Optimization for Scene Understanding with Auto-Annotation and Multimodal Learning},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {7719--7729},
}
UniVid: Unifying Vision Tasks with Pre-trained Video Generation Models: Lan Chen,

Yuchao Gu,

Qi Mao; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Chen_2026_WACV,
  author    = {Chen, Lan and Gu, Yuchao and Mao, Qi},
  title     = {{UniVid}: Unifying Vision Tasks with Pre-trained Video Generation Models},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {6754--6763},
}
MedPEFT-CL: Dual-Phase Parameter-Efficient Continual Learning with Medical Semantic Adapter and Bidirectional Memory Consolidation: Ziyuan Gao,

Philippe Morel; [pdf]
[bibtex]
@InProceedings{Gao_2026_WACV,
  author    = {Gao, Ziyuan and Morel, Philippe},
  title     = {{MedPEFT-CL}: Dual-Phase Parameter-Efficient Continual Learning with Medical Semantic Adapter and Bidirectional Memory Consolidation},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {7699--7708},
}
ZebraPose: Zebra Detection and Pose Estimation using only Synthetic Data: Elia Bonetto,

Aamir Ahmad; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Bonetto_2026_WACV,
  author    = {Bonetto, Elia and Ahmad, Aamir},
  title     = {{ZebraPose}: Zebra Detection and Pose Estimation using only Synthetic Data},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {6611--6620},
}
DM3Net: Dual-Camera Super-Resolution via Domain Modulation and Multi-scale Matching: Cong Guan,

Jiacheng Ying,

Yuya Ieiri,

Osamu Yoshie; [pdf] [supp]
[bibtex]
@InProceedings{Guan_2026_WACV,
  author    = {Guan, Cong and Ying, Jiacheng and Ieiri, Yuya and Yoshie, Osamu},
  title     = {{DM3Net}: Dual-Camera Super-Resolution via Domain Modulation and Multi-scale Matching},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {7472--7481},
}
Distilling What and Why: Enhancing Driver Intention Prediction with MLLMs: Sainithin Artham,

Avijit Dasgupta,

Shankar Gangisetty,

C.V. Jawahar; [pdf] [supp]
[bibtex]
@InProceedings{Artham_2026_WACV,
  author    = {Artham, Sainithin and Dasgupta, Avijit and Gangisetty, Shankar and Jawahar, C. V.},
  title     = {Distilling What and Why: Enhancing Driver Intention Prediction with {MLLMs}},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {7281--7290},
}
Diffusion-Based Action Recognition Generalizes to Untrained Domains: Rogério Guimarães,

Frank Xiao,

Pietro Perona,

Markus Marks; [pdf] [supp]
[bibtex]
@InProceedings{Guimaraes_2026_WACV,
  author    = {Guimar{\~a}es, Rog{\'e}rio and Xiao, Frank and Perona, Pietro and Marks, Markus},
  title     = {Diffusion-Based Action Recognition Generalizes to Untrained Domains},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {5919--5933},
}
EVTP-IVS: Effective Visual Token Pruning For Unifying Instruction Visual Segmentation In Multi-Modal Large Language Models: Wenhui Zhu,

Xiwen Chen,

Zhipeng Wang,

Shao Tang,

Sayan Ghosh,

Xuanzhao Dong,

Rajat Koner,

Yalin Wang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhu_2026_WACV,
  author    = {Zhu, Wenhui and Chen, Xiwen and Wang, Zhipeng and Tang, Shao and Ghosh, Sayan and Dong, Xuanzhao and Koner, Rajat and Wang, Yalin},
  title     = {{EVTP-IVS}: Effective Visual Token Pruning For Unifying Instruction Visual Segmentation In Multi-Modal Large Language Models},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {7158--7167},
}
ReFineVQA: Iterative Refinement of Video Description via Feedback Generation for Video Question Answering: Jeongwan Shin,

Chan Hur,

Seongmin Cho,

Jaeho Choi,

Hyeyoung Park; [pdf] [supp]
[bibtex]
@InProceedings{Shin_2026_WACV,
  author    = {Shin, Jeongwan and Hur, Chan and Cho, Seongmin and Choi, Jaeho and Park, Hyeyoung},
  title     = {{ReFineVQA}: Iterative Refinement of Video Description via Feedback Generation for Video Question Answering},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {7647--7657},
}
DUDA: Distilled Unsupervised Domain Adaptation for Lightweight Semantic Segmentation: Beomseok Kang,

Niluthpol Chowdhury Mithun,

Abhinav Rajvanshi,

Han-Pang Chiu,

Supun Samarasekera; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Kang_2026_WACV,
  author    = {Kang, Beomseok and Mithun, Niluthpol Chowdhury and Rajvanshi, Abhinav and Chiu, Han-Pang and Samarasekera, Supun},
  title     = {{DUDA}: Distilled Unsupervised Domain Adaptation for Lightweight Semantic Segmentation},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {8124--8135},
}
OPFormer: Object Pose Estimation Leveraging Foundation Model with Geometric Encoding: Artem Moroz,

Vít Zeman,

Martin Mikšík,

Elizaveta Isianova,

Miroslav David,

Pavel Burget,

Varun Burde; [pdf] [supp]
[bibtex]
@InProceedings{Moroz_2026_WACV,
  author    = {Moroz, Artem and Zeman, V{\'\i}t and Mik{\v{s}}{\'\i}k, Martin and Isianova, Elizaveta and David, Miroslav and Burget, Pavel and Burde, Varun},
  title     = {{OPFormer}: Object Pose Estimation Leveraging Foundation Model with Geometric Encoding},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {6621--6632},
}
Enhancing Reverse Distillation with Core Exemplar Learning for Unified Multi-Class Anomaly Detection: Heechul Lim,

Min-Soo Kim,

Hyun-Boo Lee,

Suk-Ju Kang,

Kang-Wook Chon,

Haeyun Lee; [pdf]
[bibtex]
@InProceedings{Lim_2026_WACV,
  author    = {Lim, Heechul and Kim, Min-Soo and Lee, Hyun-Boo and Kang, Suk-Ju and Chon, Kang-Wook and Lee, Haeyun},
  title     = {Enhancing Reverse Distillation with Core Exemplar Learning for Unified Multi-Class Anomaly Detection},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {7586--7595},
}
Joint Optimization of Camera Model and Deep Neural Network for Image Recognition: Youta Noboru,

Yuko Ozasa,

Masayuki Tanaka; [pdf] [supp]
[bibtex]
@InProceedings{Noboru_2026_WACV,
  author    = {Noboru, Youta and Ozasa, Yuko and Tanaka, Masayuki},
  title     = {Joint Optimization of Camera Model and Deep Neural Network for Image Recognition},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {7626--7635},
}
DirectDrag: High-Fidelity, Mask-Free, Prompt-Free Drag-based Image Editing via Readout-Guided Feature Alignment: Sheng-Hao Liao,

Shang-Fu Chen,

Tai-Ming Huang,

Wen-Huang Cheng,

Kai-Lung Hua; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Liao_2026_WACV,
  author    = {Liao, Sheng-Hao and Chen, Shang-Fu and Huang, Tai-Ming and Cheng, Wen-Huang and Hua, Kai-Lung},
  title     = {{DirectDrag}: High-Fidelity, Mask-Free, Prompt-Free Drag-based Image Editing via Readout-Guided Feature Alignment},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {8252--8261},
}
Single-step Diffusion for Image Compression at Ultra-Low Bitrates: Chanung Park,

Joo Chan Lee,

Jong Hwan Ko; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Park_2026_WACV,
  author    = {Park, Chanung and Lee, Joo Chan and Ko, Jong Hwan},
  title     = {Single-step Diffusion for Image Compression at Ultra-Low Bitrates},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {6391--6400},
}
TED-4DGS: Temporally Activated and Embedding-based Deformation for 4DGS Compression: Cheng-Yuan Ho,

He-Bi Yang,

Jui-Chiu Chiang,

Yu-Lun Liu,

Wen-Hsiao Peng; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ho_2026_WACV,
  author    = {Ho, Cheng-Yuan and Yang, He-Bi and Chiang, Jui-Chiu and Liu, Yu-Lun and Peng, Wen-Hsiao},
  title     = {{TED-4DGS}: Temporally Activated and Embedding-based Deformation for {4DGS} Compression},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {6371--6380},
}
View-aware Cross-modal Distillation for Multi-view Action Recognition: Trung Thanh Nguyen,

Yasutomo Kawanishi,

Vijay John,

Takahiro Komamizu,

Ichiro Ide; [pdf] [arXiv]
[bibtex]
@InProceedings{Nguyen_2026_WACV,
  author    = {Nguyen, Trung Thanh and Kawanishi, Yasutomo and John, Vijay and Komamizu, Takahiro and Ide, Ichiro},
  title     = {View-aware Cross-modal Distillation for Multi-view Action Recognition},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {7769--7778},
}
FedEFC: Federated Learning Using Enhanced Forward Correction Against Noisy Labels: Seunghun Yu,

Jin-Hyun Ahn,

Joonhyuk Kang; [pdf] [arXiv]
[bibtex]
@InProceedings{Yu_2026_WACV,
  author    = {Yu, Seunghun and Ahn, Jin-Hyun and Kang, Joonhyuk},
  title     = {{FedEFC}: Federated Learning Using Enhanced Forward Correction Against Noisy Labels},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {8094--8102},
}
LogicCBMs: Logic-Enhanced Concept-Based Learning: Deepika SN Vemuri,

Gautham Bellamkonda,

Aditya Pola,

Vineeth N Balasubramanian; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Vemuri_2026_WACV,
  author    = {Vemuri, Deepika SN and Bellamkonda, Gautham and Pola, Aditya and Balasubramanian, Vineeth N},
  title     = {{LogicCBMs}: Logic-Enhanced Concept-Based Learning},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {6039--6048},
}
FNOPT: Resolution-Agnostic, Self-Supervised Cloth Simulation using Meta-Optimization with Fourier Neural Operators: Ruochen Chen,

Thuy Tran,

Shaifali Parashar; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Chen_2026_WACV,
  author    = {Chen, Ruochen and Tran, Thuy and Parashar, Shaifali},
  title     = {{FNOPT}: Resolution-Agnostic, Self-Supervised Cloth Simulation using Meta-Optimization with {Fourier} Neural Operators},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {7116--7125},
}
Diversity Preserving Coresets for Image Quality Assessment: Arpita Nema,

Hanwei Zhu,

Xi Zhang,

Weisi Lin; [pdf] [supp]
[bibtex]
@InProceedings{Nema_2026_WACV,
  author    = {Nema, Arpita and Zhu, Hanwei and Zhang, Xi and Lin, Weisi},
  title     = {Diversity Preserving Coresets for Image Quality Assessment},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {7925--7934},
}
RoadBench: A Vision-Language Foundation Model and Benchmark for Road Damage Understanding: Xi Xiao,

Yunbei Zhang,

Janet Wang,

Lin Zhao,

Yuxiang Wei,

Hengjia Li,

Yanshu Li,

Xiao Wang,

Swalpa Kumar Roy,

Hao Xu,

Tianyang Wang; [pdf] [arXiv]
[bibtex]
@InProceedings{Xiao_2026_WACV,
  author    = {Xiao, Xi and Zhang, Yunbei and Wang, Janet and Zhao, Lin and Wei, Yuxiang and Li, Hengjia and Li, Yanshu and Wang, Xiao and Roy, Swalpa Kumar and Xu, Hao and Wang, Tianyang},
  title     = {{RoadBench}: A Vision-Language Foundation Model and Benchmark for Road Damage Understanding},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {6016--6026},
}
Optimization-Free Style Transfer for 3D Gaussian Splats: Raphael Du Sablon,

David Hart; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Du_Sablon_2026_WACV,
  author    = {Du Sablon, Raphael and Hart, David},
  title     = {Optimization-Free Style Transfer for {3D} {Gaussian} Splats},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {8041--8051},
}
From Cognitive Priors to Instance Semantics: A Unified Framework for Multi-task Affective Computing: Guanyu Hu,

Dimitrios Kollias,

Xinyu Yang; [pdf]
[bibtex]
@InProceedings{Hu_2026_WACV,
  author    = {Hu, Guanyu and Kollias, Dimitrios and Yang, Xinyu},
  title     = {From Cognitive Priors to Instance Semantics: A Unified Framework for Multi-task Affective Computing},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {8551--8562},
}
PoseAdapt: Sustainable Human Pose Estimation via Continual Learning Benchmarks and Toolkit: Muhammad Saif Ullah Khan,

Didier Stricker; [pdf] [arXiv]
[bibtex]
@InProceedings{Khan_2026_WACV,
  author    = {Khan, Muhammad Saif Ullah and Stricker, Didier},
  title     = {{PoseAdapt}: Sustainable Human Pose Estimation via Continual Learning Benchmarks and Toolkit},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {6840--6850},
}
Cycle-Consistent Multi-Graph Matching for Self-Supervised Annotation of C. Elegans: Sebastian Stricker,

Christoph Karg,

Lisa Hutschenreiter,

Bogdan Savchynskyy,

Dagmar Kainmueller; [pdf] [supp]
[bibtex]
@InProceedings{Stricker_2026_WACV,
  author    = {Stricker, Sebastian and Karg, Christoph and Hutschenreiter, Lisa and Savchynskyy, Bogdan and Kainmueller, Dagmar},
  title     = {Cycle-Consistent Multi-Graph Matching for Self-Supervised Annotation of {C. Elegans}},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {7208--7217},
}
Locally Explaining Prediction Behavior via Gradual Interventions and Measuring Property Gradients: Niklas Penzel,

Joachim Denzler; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Penzel_2026_WACV,
  author    = {Penzel, Niklas and Denzler, Joachim},
  title     = {Locally Explaining Prediction Behavior via Gradual Interventions and Measuring Property Gradients},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {7398--7408},
}
Scalable Video Action Anticipation with Cross Linear Attentive Memory: Zeyun Zhong,

Manuel Martin,

David Schneider,

David J. Lerch,

Chengzhi Wu,

Frederik Diederichs,

Juergen Gall,

Jürgen Beyerer; [pdf] [supp]
[bibtex]
@InProceedings{Zhong_2026_WACV,
  author    = {Zhong, Zeyun and Martin, Manuel and Schneider, David and Lerch, David J. and Wu, Chengzhi and Diederichs, Frederik and Gall, Juergen and Beyerer, J{\"u}rgen},
  title     = {Scalable Video Action Anticipation with Cross Linear Attentive Memory},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {8113--8123},
}
FairVLM: Enhancing Fairness and Prompt Sensitivity in Vision Language Models for Medical Image Segmentation: Md Motiur Rahman,

Saeka Rahman,

Smriti Bhatt,

Miad Faezipour; [pdf] [supp]
[bibtex]
@InProceedings{Rahman_2026_WACV,
  author    = {Rahman, Md Motiur and Rahman, Saeka and Bhatt, Smriti and Faezipour, Miad},
  title     = {{FairVLM}: Enhancing Fairness and Prompt Sensitivity in Vision Language Models for Medical Image Segmentation},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {7450--7460},
}
NRGMark: Localized Watermarking for Energy Transparency in Images: Shruti Agarwal,

Élie Michel,

Vishal Asnani,

Tania Mathern,

John Collomosse; [pdf]
[bibtex]
@InProceedings{Agarwal_2026_WACV,
  author    = {Agarwal, Shruti and Michel, {\'E}lie and Asnani, Vishal and Mathern, Tania and Collomosse, John},
  title     = {{NRGMark}: Localized Watermarking for Energy Transparency in Images},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {7779--7788},
}
V2XScene: Multi-View Consistent 3D Scene Simulation for Collaborative Perception: Yanfei Li,

Yi Gong,

Yuan Zeng; [pdf]
[bibtex]
@InProceedings{Li_2026_WACV,
  author    = {Li, Yanfei and Gong, Yi and Zeng, Yuan},
  title     = {{V2XScene}: Multi-View Consistent {3D} Scene Simulation for Collaborative Perception},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {6569--6579},
}
Advancing Multimodal LLMs by Large-Scale 3D Visual Instruction Dataset Generation: Liu He,

Xiao Zeng,

Yizhi Song,

Albert Y. C. Chen,

Lu Xia,

Shashwat Verma,

Sankalp Dayal,

Min Sun,

Cheng-Hao Kuo,

Daniel Aliaga; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{He_2026_WACV,
  author    = {He, Liu and Zeng, Xiao and Song, Yizhi and Chen, Albert Y. C. and Xia, Lu and Verma, Shashwat and Dayal, Sankalp and Sun, Min and Kuo, Cheng-Hao and Aliaga, Daniel},
  title     = {Advancing Multimodal {LLMs} by Large-Scale {3D} Visual Instruction Dataset Generation},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {5886--5897},
}
Test-Time Adaptation for Video Highlight Detection Using Meta-Auxiliary Learning and Cross-Modality Hallucinations: Zahidul Islam,

Sujoy Paul,

Mrigank Rochan; [pdf] [arXiv]
[bibtex]
@InProceedings{Islam_2026_WACV,
  author    = {Islam, Zahidul and Paul, Sujoy and Rochan, Mrigank},
  title     = {Test-Time Adaptation for Video Highlight Detection Using Meta-Auxiliary Learning and Cross-Modality Hallucinations},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {6893--6902},
}
Stabilizing Direct Training of Spiking Neural Networks: Membrane Potential Initialization and Threshold-robust Surrogate Gradient: Hyunho Kook,

Byeongho Yu,

Jeong Min Oh,

Eunhyeok Park; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Kook_2026_WACV,
    author    = {Kook, Hyunho and Yu, Byeongho and Oh, Jeong Min and Park, Eunhyeok},
    title     = {Stabilizing Direct Training of Spiking Neural Networks: Membrane Potential Initialization and Threshold-robust Surrogate Gradient},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {8500--8510}
}
SphereEdit: Spherical Semantic Editing in Diffusion Models: Salamata Konate,

Hassan Hamidi,

Elham Dolatabadi,

Frank Rudzicz,

Laleh Seyyed-Kalantari; [pdf] [supp]
[bibtex]
@InProceedings{Konate_2026_WACV,
    author    = {Konate, Salamata and Hamidi, Hassan and Dolatabadi, Elham and Rudzicz, Frank and Seyyed-Kalantari, Laleh},
    title     = {{SphereEdit}: Spherical Semantic Editing in Diffusion Models},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {8084--8093}
}
S2O: Static to Openable Enhancement for Articulated 3D Objects: Denys Iliash,

Hanxiao Jiang,

Yiming Zhang,

Manolis Savva,

Angel X. Chang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Iliash_2026_WACV,
    author    = {Iliash, Denys and Jiang, Hanxiao and Zhang, Yiming and Savva, Manolis and Chang, Angel X.},
    title     = {{S2O}: Static to Openable Enhancement for Articulated {3D} Objects},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {6785--6795}
}
UniGaze: Towards Universal Gaze Estimation via Large-scale Pre-Training: Jiawei Qin,

Xucong Zhang,

Yusuke Sugano; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Qin_2026_WACV,
    author    = {Qin, Jiawei and Zhang, Xucong and Sugano, Yusuke},
    title     = {{UniGaze}: Towards Universal Gaze Estimation via Large-scale Pre-Training},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {5809--5820}
}
Splatter Layout: Geometry-embedded 3D Reconstruction via Surface Unfolding: Bryan Heryanto,

Tackgeun You,

Chanwoo Kim,

Hwasup Lim; [pdf] [supp]
[bibtex]
@InProceedings{Heryanto_2026_WACV,
    author    = {Heryanto, Bryan and You, Tackgeun and Kim, Chanwoo and Lim, Hwasup},
    title     = {Splatter Layout: Geometry-embedded {3D} Reconstruction via Surface Unfolding},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {7709--7718}
}
Optimal Transport for Rectified Flow Image Editing: Unifying Inversion-Based and Direct Methods: Marian Lupaşcu,

Mihai Sorin Stupariu; [pdf] [supp]
[bibtex]
@InProceedings{Lupascu_2026_WACV,
    author    = {Lupa{\c{s}}cu, Marian and Stupariu, Mihai Sorin},
    title     = {Optimal Transport for Rectified Flow Image Editing: Unifying Inversion-Based and Direct Methods},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {6764--6774}
}
ICONIC-444: A 3.1-Million-Image Dataset for OOD Detection Research: Gerhard Krumpl,

Henning Avenhaus,

Horst Possegger; [pdf] [supp]
[bibtex]
@InProceedings{Krumpl_2026_WACV,
    author    = {Krumpl, Gerhard and Avenhaus, Henning and Possegger, Horst},
    title     = {{ICONIC-444}: A 3.1-Million-Image Dataset for {OOD} Detection Research},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {8427--8436}
}
FuLLaMa: Training-free Diffusion-based Object Removal with Context Preservation: Ilke Demir,

Umur Aybars Ciftci; [pdf] [supp]
[bibtex]
@InProceedings{Demir_2026_WACV,
    author    = {Demir, Ilke and Ciftci, Umur Aybars},
    title     = {{FuLLaMa}: Training-free Diffusion-based Object Removal with Context Preservation},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {8563--8573}
}
Where is the Watermark? Interpretable Watermark Detection at the Block Level: Maria Bulychev,

Neil G. Marchant,

Benjamin I. P. Rubinstein; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Bulychev_2026_WACV,
    author    = {Bulychev, Maria and Marchant, Neil G. and Rubinstein, Benjamin I. P.},
    title     = {Where is the Watermark? {Interpretable} Watermark Detection at the Block Level},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {7420--7429}
}
HABIT: Human Action Benchmark for Interactive Traffic in CARLA: Mohan Ramesh,

Mark Azer,

Fabian Flohr; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ramesh_2026_WACV,
    author    = {Ramesh, Mohan and Azer, Mark and Flohr, Fabian},
    title     = {{HABIT}: Human Action Benchmark for Interactive Traffic in {CARLA}},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {7148--7157}
}
Patch Your Matcher: Correspondence-Aware Image-to-Image Translation Unlocks Cross-Modal Matching via Single-Modality Priors: Anton Frolov,

Volker Rodehorst; [pdf] [supp]
[bibtex]
@InProceedings{Frolov_2026_WACV,
    author    = {Frolov, Anton and Rodehorst, Volker},
    title     = {Patch Your Matcher: Correspondence-Aware Image-to-Image Translation Unlocks Cross-Modal Matching via Single-Modality Priors},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {7913--7924}
}
A Deep Network for Object Detection on Inland Waters: Dennis Griesser,

Bastian Goldluecke,

Matthias O. Franz,

Georg Umlauf; [pdf] [supp]
[bibtex]
@InProceedings{Griesser_2026_WACV,
    author    = {Griesser, Dennis and Goldluecke, Bastian and Franz, Matthias O. and Umlauf, Georg},
    title     = {A Deep Network for Object Detection on Inland Waters},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {6590--6599}
}
Logit-Adjusted Test-Time Adaptation under Partial Class Imbalance: Thilina Weerasinghe,

Ruwan Tennakoon,

WeiQin Chuah,

Alireza Bab-Hadiashar; [pdf] [supp]
[bibtex]
@InProceedings{Weerasinghe_2026_WACV,
    author    = {Weerasinghe, Thilina and Tennakoon, Ruwan and Chuah, WeiQin and Bab-Hadiashar, Alireza},
    title     = {Logit-Adjusted Test-Time Adaptation under Partial Class Imbalance},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {5977--5985}
}
AuthGuard: Generalizable Deepfake Detection via Language Guidance: Guangyu Shen,

Zhihua Li,

Xiang Xu,

Tianchen Zhao,

Zheng Zhang,

Dongsheng An,

Zhuowen Tu,

Yifan Xing,

Qin Zhang; [pdf] [arXiv]
[bibtex]
@InProceedings{Shen_2026_WACV,
    author    = {Shen, Guangyu and Li, Zhihua and Xu, Xiang and Zhao, Tianchen and Zhang, Zheng and An, Dongsheng and Tu, Zhuowen and Xing, Yifan and Zhang, Qin},
    title     = {{AuthGuard}: Generalizable Deepfake Detection via Language Guidance},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {6215--6225}
}
VIZOR: Viewpoint-Invariant Zero-Shot Scene Graph Generation for 3D Scene Reasoning: Vivek Madhavaram,

Vartika Sengar,

Arkadipta De,

Charu Sharma; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Madhavaram_2026_WACV,
    author    = {Madhavaram, Vivek and Sengar, Vartika and De, Arkadipta and Sharma, Charu},
    title     = {{VIZOR}: Viewpoint-Invariant Zero-Shot Scene Graph Generation for {3D} Scene Reasoning},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {8584--8595}
}
Gaussian Splatting Map Registration with Orthographic Bird's-Eye-View Renderings: H. Leblond,

G. Simon,

R. Martins,

C. Demonceaux,

M.-O. Berger; [pdf] [supp]
[bibtex]
@InProceedings{Leblond_2026_WACV,
    author    = {Leblond, H. and Simon, G. and Martins, R. and Demonceaux, C. and Berger, M.-O.},
    title     = {{Gaussian} Splatting Map Registration with Orthographic Bird's-Eye-View Renderings},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {6080--6089}
}
IPCD: Intrinsic Point-Cloud Decomposition: Shogo Sato,

Takuhiro Kaneko,

Shoichiro Takeda,

Tomoyasu Shimada,

Kazuhiko Murasaki,

Taiga Yoshida,

Ryuichi Tanida,

Akisato Kimura; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Sato_2026_WACV,
    author    = {Sato, Shogo and Kaneko, Takuhiro and Takeda, Shoichiro and Shimada, Tomoyasu and Murasaki, Kazuhiko and Yoshida, Taiga and Tanida, Ryuichi and Kimura, Akisato},
    title     = {{IPCD}: Intrinsic Point-Cloud Decomposition},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {7094--7103}
}
Diffusion Noise Optimization for Synthetic VLM Training: Ren Ohkubo,

Rintaro Yanagi,

Hirokatsu Kataoka,

Yutaka Satoh; [pdf] [supp]
[bibtex]
@InProceedings{Ohkubo_2026_WACV,
    author    = {Ohkubo, Ren and Yanagi, Rintaro and Kataoka, Hirokatsu and Satoh, Yutaka},
    title     = {Diffusion Noise Optimization for Synthetic {VLM} Training},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {6412--6421}
}
TacticalCalib: End-to-End 6-DoF Camera Pose Regression for Tactical Camera Calibration: Liang Fan,

Xiaoqian Liu,

Zhi Chen,

Lingkai Yang; [pdf]
[bibtex]
@InProceedings{Fan_2026_WACV,
    author    = {Fan, Liang and Liu, Xiaoqian and Chen, Zhi and Yang, Lingkai},
    title     = {{TacticalCalib}: End-to-End {6-DoF} Camera Pose Regression for Tactical Camera Calibration},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {6547--6556}
}
FlowCLAS: Enhancing Normalizing Flow-Based Anomaly Segmentation Via Contrastive Learning: Chang Won Lee,

Selina Leveugle,

Paul Grouchy,

Chris Langley,

Svetlana Stolpner,

Jonathan Kelly,

Steven L. Waslander; [pdf] [supp]
[bibtex]
@InProceedings{Lee_2026_WACV,
    author    = {Lee, Chang Won and Leveugle, Selina and Grouchy, Paul and Langley, Chris and Stolpner, Svetlana and Kelly, Jonathan and Waslander, Steven L.},
    title     = {{FlowCLAS}: Enhancing Normalizing Flow-Based Anomaly Segmentation Via Contrastive Learning},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {6998--7007}
}
SuperRivolution: Fine-Scale Rivers from Coarse Temporal Satellite Imagery: Rangel Daroya,

Subhransu Maji; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Daroya_2026_WACV,
    author    = {Daroya, Rangel and Maji, Subhransu},
    title     = {{SuperRivolution}: Fine-Scale Rivers from Coarse Temporal Satellite Imagery},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {7482--7492}
}
R-MMA: Enhancing Vision-Language Models with Recurrent Adapters for Few-Shot and Cross-Domain Generalization: Md Fahim,

Md Farhan Ishmam,

Mir Sazzat Hossain,

M Ashraful Amin,

Amin Ahsan Ali,

AKM Mahbubur Rahman; [pdf] [supp]
[bibtex]
@InProceedings{Fahim_2026_WACV,
    author    = {Fahim, Md and Ishmam, Md Farhan and Hossain, Mir Sazzat and Amin, M Ashraful and Ali, Amin Ahsan and Rahman, AKM Mahbubur},
    title     = {{R-MMA}: Enhancing Vision-Language Models with Recurrent Adapters for Few-Shot and Cross-Domain Generalization},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {6496--6506}
}
TRACE: Confounder-free Adversarial Fine-tuning for Robust Object Detection: Wonho Lee,

Jisu Lee,

Hyunsik Na,

Sohee Park,

Daeseon Choi; [pdf] [supp]
[bibtex]
@InProceedings{Lee_2026_WACV,
    author    = {Lee, Wonho and Lee, Jisu and Na, Hyunsik and Park, Sohee and Choi, Daeseon},
    title     = {{TRACE}: Confounder-free Adversarial Fine-tuning for Robust Object Detection},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {6705--6714}
}
SOLAR: Switchable Output Layer for Accuracy and Robustness in Once-for-All Training: Shaharyar Ahmed Khan Tareen,

Lei Fan,

Xiaojing Yuan,

Qin Lin,

Bin Hu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Tareen_2026_WACV,
    author    = {Tareen, Shaharyar Ahmed Khan and Fan, Lei and Yuan, Xiaojing and Lin, Qin and Hu, Bin},
    title     = {{SOLAR}: Switchable Output Layer for Accuracy and Robustness in Once-for-All Training},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {7893--7902}
}
DexAvatar: 3D Sign Language Reconstruction with Hand and Body Pose Priors: Kaustubh Kundu,

Hrishav Bakul Barua,

Lucy Robertson-Bell,

Zhixi Cai,

Kalin Stefanov; [pdf] [supp]
[bibtex]
@InProceedings{Kundu_2026_WACV,
    author    = {Kundu, Kaustubh and Barua, Hrishav Bakul and Robertson-Bell, Lucy and Cai, Zhixi and Stefanov, Kalin},
    title     = {{DexAvatar}: {3D} Sign Language Reconstruction with Hand and Body Pose Priors},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {5842--5852}
}
SegMo: Segment-aligned Text to 3D Human Motion Generation: Bowen Dang,

Lin Wu,

Xiaohang Yang,

Zheng Yuan,

Zhixiang Chen; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Dang_2026_WACV,
    author    = {Dang, Bowen and Wu, Lin and Yang, Xiaohang and Yuan, Zheng and Chen, Zhixiang},
    title     = {{SegMo}: Segment-aligned Text to {3D} Human Motion Generation},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {6946--6955}
}
SceneProp: Combining Neural Network and Markov Random Field for Scene-Graph Grounding: Keita Otani,

Tatsuya Harada; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Otani_2026_WACV,
    author    = {Otani, Keita and Harada, Tatsuya},
    title     = {{SceneProp}: Combining Neural Network and {Markov} Random Field for Scene-Graph Grounding},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {6153--6162}
}
WiSAR3D - Aerial LiDAR Dataset for 3D Object Detection: Oren Shrout,

Ori Nizan,

Yizhak Ben-Shabat,

Ayellet Tal; [pdf] [supp]
[bibtex]
@InProceedings{Shrout_2026_WACV,
    author    = {Shrout, Oren and Nizan, Ori and Ben-Shabat, Yizhak and Tal, Ayellet},
    title     = {{WiSAR3D} - Aerial {LiDAR} Dataset for {3D} Object Detection},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {6580--6589}
}
Exploiting Label-Independent Regularization from Spatial Patterns for Whole Slide Image Analysis: Weiyi Wu,

Xinwen Xu,

Chongyang Gao,

Xingjian Diao,

Siting Li,

Jiang Gui; [pdf] [supp]
[bibtex]
@InProceedings{Wu_2026_WACV,
    author    = {Wu, Weiyi and Xu, Xinwen and Gao, Chongyang and Diao, Xingjian and Li, Siting and Gui, Jiang},
    title     = {Exploiting Label-Independent Regularization from Spatial Patterns for Whole Slide Image Analysis},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {8639--8649}
}
Co-STAR: Collaborative Curriculum Self-Training with Adaptive Regularization for Source-Free Video Domain Adaptation: Amirhossein Dadashzadeh,

Parsa Esmati,

Majid Mirmehdi; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Dadashzadeh_2026_WACV,
    author    = {Dadashzadeh, Amirhossein and Esmati, Parsa and Mirmehdi, Majid},
    title     = {{Co-STAR}: Collaborative Curriculum Self-Training with Adaptive Regularization for Source-Free Video Domain Adaptation},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {7821--7831}
}
QuEENet: Quantum-Enhanced Expressive Network for Image Classification: Shashank Bayal,

Rushikesh Govind Dawane,

Komal Komal,

Santosh Kumar Vipparthi,

Subrahmanyam Murala; [pdf] [supp]
[bibtex]
@InProceedings{Bayal_2026_WACV,
    author    = {Bayal, Shashank and Dawane, Rushikesh Govind and Komal, Komal and Vipparthi, Santosh Kumar and Murala, Subrahmanyam},
    title     = {{QuEENet}: Quantum-Enhanced Expressive Network for Image Classification},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {7883--7892}
}
SHaSaM: Submodular Hard Sample Mining for Fair Facial Attribute Recognition: Anay Majee,

Rishabh Iyer; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Majee_2026_WACV,
    author    = {Majee, Anay and Iyer, Rishabh},
    title     = {{SHaSaM}: Submodular Hard Sample Mining for Fair Facial Attribute Recognition},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {7461--7471}
}
SGD-Mix: Enhancing Domain-Specific Image Classification with Label-Preserving Data Augmentation: Yixuan Dong,

Fang-Yi Su,

Jung-Hsien Chiang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Dong_2026_WACV,
    author    = {Dong, Yixuan and Su, Fang-Yi and Chiang, Jung-Hsien},
    title     = {{SGD-Mix}: Enhancing Domain-Specific Image Classification with Label-Preserving Data Augmentation},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {7051--7061}
}
Unsupervised Discovery of Long-Term Spatiotemporal Periodic Workflows in Human Activities: Fan Yang,

Quanting Xie,

Atsunori Moteki,

Shoichi Masui,

Shan Jiang,

Kanji Uchino,

Yonatan Bisk,

Graham Neubig; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yang_2026_WACV,
    author    = {Yang, Fan and Xie, Quanting and Moteki, Atsunori and Masui, Shoichi and Jiang, Shan and Uchino, Kanji and Bisk, Yonatan and Neubig, Graham},
    title     = {Unsupervised Discovery of Long-Term Spatiotemporal Periodic Workflows in Human Activities},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {5821--5832}
}
Revisiting an Old Perspective Projection for Monocular 3D Morphable Models Regression: Toby Chong,

Ryota Nakajima; [pdf] [arXiv]
[bibtex]
@InProceedings{Chong_2026_WACV,
    author    = {Chong, Toby and Nakajima, Ryota},
    title     = {Revisiting an Old Perspective Projection for Monocular {3D} Morphable Models Regression},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {7799--7808}
}
SafeguardGS: 3D Gaussian Primitive Pruning While Avoiding Catastrophic Scene Destruction: Yongjae Lee,

Zhaoliang Zhang,

Deliang Fan; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Lee_2026_WACV,
    author    = {Lee, Yongjae and Zhang, Zhaoliang and Fan, Deliang},
    title     = {{SafeguardGS}: {3D} {Gaussian} Primitive Pruning While Avoiding Catastrophic Scene Destruction},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {8479--8489}
}
Deep Image Decomposition for Medical Imaging Anonymization and Curation: Yael Elkin,

Gal Ben-Arie,

Tammy Riklin-Raviv; [pdf] [supp]
[bibtex]
@InProceedings{Elkin_2026_WACV,
    author    = {Elkin, Yael and Ben-Arie, Gal and Riklin-Raviv, Tammy},
    title     = {Deep Image Decomposition for Medical Imaging Anonymization and Curation},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {7229--7238}
}
Clear Sights on Site: A Spatial-Adaptive Channel Network for Deblurring Construction Site Images: Mahdi Bonyani,

Maryam Soleymani,

Chao Wang; [pdf] [supp]
[bibtex]
@InProceedings{Bonyani_2026_WACV,
    author    = {Bonyani, Mahdi and Soleymani, Maryam and Wang, Chao},
    title     = {Clear Sights on Site: A Spatial-Adaptive Channel Network for Deblurring Construction Site Images},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {6936--6945}
}
GRAPE (Gaussian Rendering for Accelerated Pixel Enhancement) Brings Fast and Lightweight Arbitrary Super-Resolution: Jung In Jang,

Kyong Hwan Jin; [pdf] [supp]
[bibtex]
@InProceedings{Jang_2026_WACV,
    author    = {Jang, Jung In and Jin, Kyong Hwan},
    title     = {{GRAPE} ({Gaussian} Rendering for Accelerated Pixel Enhancement) Brings Fast and Lightweight Arbitrary Super-Resolution},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {7750--7758}
}
HodgeFormer: Transformers for Learnable Operators on Triangular Meshes through Data-Driven Hodge Matrices: Akis Nousias,

Stavros Nousias; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Nousias_2026_WACV,
    author    = {Nousias, Akis and Nousias, Stavros},
    title     = {{HodgeFormer}: Transformers for Learnable Operators on Triangular Meshes through Data-Driven {Hodge} Matrices},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {6796--6805}
}
Uplifting Table Tennis: A Robust, Real-World Application for 3D Trajectory and Spin Estimation: Daniel Kienzle,

Katja Ludwig,

Julian Lorenz,

Shin'Ichi Satoh,

Rainer Lienhart; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Kienzle_2026_WACV,
    author    = {Kienzle, Daniel and Ludwig, Katja and Lorenz, Julian and Satoh, Shin'Ichi and Lienhart, Rainer},
    title     = {Uplifting Table Tennis: A Robust, Real-World Application for {3D} Trajectory and Spin Estimation},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {7440--7449}
}
GeneVA: A Dataset of Human Annotations for Generative Text to Video Artifacts: Jenna Kang,

Maria Beatriz Silva,

Patsorn Sangkloy,

Kenneth Chen,

Niall L. Williams,

Qi Sun; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Kang_2026_WACV,
    author    = {Kang, Jenna and Silva, Maria Beatriz and Sangkloy, Patsorn and Chen, Kenneth and Williams, Niall L. and Sun, Qi},
    title     = {{GeneVA}: A Dataset of Human Annotations for Generative Text to Video Artifacts},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {6174--6183}
}
Synthesizing Compositional Videos from Text Description: Prajwal Singh,

Kuldeep Kulkarni,

Shanmuganathan Raman,

Harsh Rangwani; [pdf] [supp]
[bibtex]
@InProceedings{Singh_2026_WACV,
    author    = {Singh, Prajwal and Kulkarni, Kuldeep and Raman, Shanmuganathan and Rangwani, Harsh},
    title     = {Synthesizing Compositional Videos from Text Description},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {6775--6784}
}
SSMT-Net: A Semi-Supervised Multitask Transformer-Based Network for Thyroid Nodule Segmentation in Ultrasound Images: Muhammad Umar Farooq,

Abd Ur Rehman,

Azka Rehman,

Muhammad Usman,

Dong-Kyu Chae; [pdf]
[bibtex]
@InProceedings{Farooq_2026_WACV,
    author    = {Farooq, Muhammad Umar and Rehman, Abd Ur and Rehman, Azka and Usman, Muhammad and Chae, Dong-Kyu},
    title     = {{SSMT-Net}: A Semi-Supervised Multitask Transformer-Based Network for Thyroid Nodule Segmentation in Ultrasound Images},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {6069--6079}
}
SAVE: Sparse Autoencoder-Driven Visual Information Enhancement for Mitigating Object Hallucination: Sangha Park,

Seungryong Yoo,

Jisoo Mok,

Sungroh Yoon; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Park_2026_WACV,
    author    = {Park, Sangha and Yoo, Seungryong and Mok, Jisoo and Yoon, Sungroh},
    title     = {{SAVE}: Sparse Autoencoder-Driven Visual Information Enhancement for Mitigating Object Hallucination},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {7935--7944}
}
Non-Aligned Reference Image Quality Assessment for Novel View Synthesis: Abhijay Ghildyal,

Rajesh Sureddi,

Nabajeet Barman,

Saman Zadtootaghaj,

Alan C Bovik; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ghildyal_2026_WACV,
    author    = {Ghildyal, Abhijay and Sureddi, Rajesh and Barman, Nabajeet and Zadtootaghaj, Saman and Bovik, Alan C},
    title     = {Non-Aligned Reference Image Quality Assessment for Novel View Synthesis},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {6350--6359}
}
BAFLE-DCT: Bypassing Adversarial Filters via Frequency-Selective Embedding in the DCT Domain: Thilina Mendis,

Farah Kandah,

Sathyanarayanan N. Aakur; [pdf]
[bibtex]
@InProceedings{Mendis_2026_WACV,
    author    = {Mendis, Thilina and Kandah, Farah and Aakur, Sathyanarayanan N.},
    title     = {{BAFLE-DCT}: Bypassing Adversarial Filters via Frequency-Selective Embedding in the {DCT} Domain},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {5967--5976}
}
VLMDiff: Leveraging Vision-Language Models for Multi-Class Anomaly Detection with Diffusion: Samet Hicsonmez,

Abd El Rahman Shabayek,

Djamila Aouada; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Hicsonmez_2026_WACV,
    author    = {Hicsonmez, Samet and Shabayek, Abd El Rahman and Aouada, Djamila},
    title     = {{VLMDiff}: Leveraging Vision-Language Models for Multi-Class Anomaly Detection with Diffusion},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {6309--6319}
}
MapVerse: A Benchmark for Geospatial Question Answering on Diverse Real-World Maps: Sharat Bhat,

Harshita Khandelwal,

Tushar Kataria,

Vivek Gupta; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Bhat_2026_WACV,
    author    = {Bhat, Sharat and Khandelwal, Harshita and Kataria, Tushar and Gupta, Vivek},
    title     = {{MapVerse}: A Benchmark for Geospatial Question Answering on Diverse Real-World Maps},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {8168--8178}
}
Integrating Multi-scale and Multi-filtration Topological Features for Medical Image Classification: Pengfei Gu,

Huimin Li,

Haoteng Tang,

Dongkuan Xu,

Erik Enriquez,

DongChul Kim,

Bin Fu,

Danny Z Chen; [pdf] [arXiv]
[bibtex]
@InProceedings{Gu_2026_WACV,
    author    = {Gu, Pengfei and Li, Huimin and Tang, Haoteng and Xu, Dongkuan and Enriquez, Erik and Kim, DongChul and Fu, Bin and Chen, Danny Z},
    title     = {Integrating Multi-scale and Multi-filtration Topological Features for Medical Image Classification},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {8660--8669}
}
FlyPose: Towards Robust Human Pose Estimation From Aerial Views: Hassaan Farooq,

Marvin Brenner,

Peter Stütz; [pdf]
[bibtex]
@InProceedings{Farooq_2026_WACV,
    author    = {Farooq, Hassaan and Brenner, Marvin and St{\"u}tz, Peter},
    title     = {{FlyPose}: Towards Robust Human Pose Estimation From Aerial Views},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {8617--8627}
}
SAVeD: Learning to Denoise Low-SNR Video for Improved Downstream Performance: Suzanne Stathatos,

Michael Hobley,

Pietro Perona,

Markus Marks; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Stathatos_2026_WACV,
    author    = {Stathatos, Suzanne and Hobley, Michael and Perona, Pietro and Marks, Markus},
    title     = {{SAVeD}: Learning to Denoise {Low-SNR} Video for Improved Downstream Performance},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {6851--6861}
}
See, Record, Do: Automated Generation of UI Workflows from Tutorial Videos: Adam Beauchaine,

Craig Shue; [pdf]
[bibtex]
@InProceedings{Beauchaine_2026_WACV,
    author    = {Beauchaine, Adam and Shue, Craig},
    title     = {See, Record, Do: Automated Generation of {UI} Workflows from Tutorial Videos},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {6256--6265}
}
VADER: Towards Causal Video Anomaly Understanding with Relation-Aware Large Language Models: Ying Cheng,

Yu-Ho Lin,

Min-Hung Chen,

Fu-En Yang,

Shang-Hong Lai; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Cheng_2026_WACV,
    author    = {Cheng, Ying and Lin, Yu-Ho and Chen, Min-Hung and Yang, Fu-En and Lai, Shang-Hong},
    title     = {{VADER}: Towards Causal Video Anomaly Understanding with Relation-Aware Large Language Models},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {7301--7311}
}
Pretraining Helps When Capacity Allows: Evidence from Ultra-Small ConvNets: Srikanth Muralidharan,

Heitor R. Medeiros,

Masih Aminbeidokhti,

Eric Granger,

Marco Pedersoli; [pdf] [supp]
[bibtex]
@InProceedings{Muralidharan_2026_WACV,
    author    = {Muralidharan, Srikanth and Medeiros, Heitor R. and Aminbeidokhti, Masih and Granger, Eric and Pedersoli, Marco},
    title     = {Pretraining Helps When Capacity Allows: Evidence from Ultra-Small {ConvNets}},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {8333--8342}
}
SmoothDiffusion-VE: Real-time Generative Video Editing Using Adaptive Feature Cache: Mustafa Munir,

Sophia Zalewski,

Shiqiu Liu,

David Tarjan,

Sushmitha Belede,

Anjul Patney,

Radu Marculescu; [pdf] [supp]
[bibtex]
@InProceedings{Munir_2026_WACV,
    author    = {Munir, Mustafa and Zalewski, Sophia and Liu, Shiqiu and Tarjan, David and Belede, Sushmitha and Patney, Anjul and Marculescu, Radu},
    title     = {{SmoothDiffusion-VE}: Real-time Generative Video Editing Using Adaptive Feature Cache},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {8468--8478}
}
Leveraging Sparsity for Privacy in Collaborative Inference: Maximilian Andreas Hoefler,

Karsten Mueller,

Wojciech Samek; [pdf] [supp]
[bibtex]
@InProceedings{Hoefler_2026_WACV,
    author    = {Hoefler, Maximilian Andreas and Mueller, Karsten and Samek, Wojciech},
    title     = {Leveraging Sparsity for Privacy in Collaborative Inference},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {7596--7604}
}
UltraClean: A Simple Framework to Train Robust Neural Networks against Backdoor Attacks: Bingyin Zhao,

Yingjie Lao; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhao_2026_WACV,
    author    = {Zhao, Bingyin and Lao, Yingjie},
    title     = {{UltraClean}: A Simple Framework to Train Robust Neural Networks against Backdoor Attacks},
    booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
    month     = mar,
    year      = {2026},
    pages     = {8353--8363}
}
QAL : A Loss for Recall-Precision Balance in 3D Reconstruction: Pranay Meshram,

Yash Turkar,

Kartikeya Singh,

Praveen Raj Masilamani,

Charuvahan Adhivarahan,

Karthik Dantu; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Meshram_2026_WACV,
  author    = {Meshram, Pranay and Turkar, Yash and Singh, Kartikeya and Masilamani, Praveen Raj and Adhivarahan, Charuvahan and Dantu, Karthik},
  title     = {{QAL} : A Loss for Recall-Precision Balance in {3D} Reconstruction},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {7965--7974}
}
DualRes: Production-ready Dynamic Object Detection: Jibril El Hassani,

Thomas Verelst; [pdf]
[bibtex]
@InProceedings{El_Hassani_2026_WACV,
  author    = {El Hassani, Jibril and Verelst, Thomas},
  title     = {{DualRes}: Production-ready Dynamic Object Detection},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {7842--7851}
}
Meta-YOLO: Metadata-Guided Real-Time Object Detector in Aerial Imagery: Deukryeol Yoon,

Seonghak Kim,

Young Hwa Sung,

Jinho Jung; [pdf] [supp]
[bibtex]
@InProceedings{Yoon_2026_WACV,
  author    = {Yoon, Deukryeol and Kim, Seonghak and Sung, Young Hwa and Jung, Jinho},
  title     = {{Meta-YOLO}: Metadata-Guided Real-Time Object Detector in Aerial Imagery},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {7975--7984}
}
Generalized Category Discovery for LiDAR Semantic Segmentation: Minseok Kim,

Jiyong Boo,

Kuk-Jin Yoon; [pdf] [supp]
[bibtex]
@InProceedings{Kim_2026_WACV,
  author    = {Kim, Minseok and Boo, Jiyong and Yoon, Kuk-Jin},
  title     = {Generalized Category Discovery for {LiDAR} Semantic Segmentation},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {8416--8426}
}
NeuroBridge: Few-Shot Cross-Modal Neuron Re-identification via Dual-Channel Deep Metric Learning: Wenwei Li,

Mingwei Liao,

Lingyi Cai,

Anan Li; [pdf] [supp]
[bibtex]
@InProceedings{Li_2026_WACV,
  author    = {Li, Wenwei and Liao, Mingwei and Cai, Lingyi and Li, Anan},
  title     = {{NeuroBridge}: Few-Shot Cross-Modal Neuron Re-identification via Dual-Channel Deep Metric Learning},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {8670--8679}
}
IPTQ-ViT: Post-Training Quantization of Non-linear Functions for Integer-only Vision Transformers: Gihwan Kim,

Jemin Lee,

Hyungshin Kim; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Kim_2026_WACV,
  author    = {Kim, Gihwan and Lee, Jemin and Kim, Hyungshin},
  title     = {{IPTQ-ViT}: Post-Training Quantization of Non-linear Functions for Integer-only Vision Transformers},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {7366--7375}
}
Denoise, Divide, Distill, and Predict (D3P): Towards Forecasting Long-horizon Real-world Anomaly from Normalcy: Quentin Mérilleau,

Snehashis Majhi,

Antitza Dantcheva,

Quan Kong,

Lorenzo Garattoni,

Gianpiero Francesca,

Francois Bremond; [pdf]
[bibtex]
@InProceedings{Merilleau_2026_WACV,
  author    = {M{\'e}rilleau, Quentin and Majhi, Snehashis and Dantcheva, Antitza and Kong, Quan and Garattoni, Lorenzo and Francesca, Gianpiero and Bremond, Francois},
  title     = {Denoise, Divide, Distill, and Predict ({D3P}): Towards Forecasting Long-horizon Real-world Anomaly from Normalcy},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {6246--6255}
}
Zero-Shot Domain Generalisation via Prompt-Driven Feature Refinement: Tingrui Qiao,

Di Zhao,

Caroline Walker,

Chris Cunningham,

Yun Sing Koh; [pdf]
[bibtex]
@InProceedings{Qiao_2026_WACV,
  author    = {Qiao, Tingrui and Zhao, Di and Walker, Caroline and Cunningham, Chris and Koh, Yun Sing},
  title     = {Zero-Shot Domain Generalisation via Prompt-Driven Feature Refinement},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {6184--6193}
}
Generalizing Sports Feedback Generation by Watching Competitions and Reading Books: A Rock Climbing Case Study: Arushi Rai,

Adriana Kovashka; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Rai_2026_WACV,
  author    = {Rai, Arushi and Kovashka, Adriana},
  title     = {Generalizing Sports Feedback Generation by Watching Competitions and Reading Books: A Rock Climbing Case Study},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {8136--8145}
}
Neural Geometry Image-Based Representations with Optimal Transport (OT): Xiang Gao,

Yuanpeng Liu,

Jiazhi Li,

Xinmu Wang,

Minghao Guo,

Yu Guo,

Xiyun Song,

Heather Yu,

Zhiqiang Lao,

Xianfeng David Gu; [pdf] [arXiv]
[bibtex]
@InProceedings{Gao_2026_WACV,
  author    = {Gao, Xiang and Liu, Yuanpeng and Li, Jiazhi and Wang, Xinmu and Guo, Minghao and Guo, Yu and Song, Xiyun and Yu, Heather and Lao, Zhiqiang and Gu, Xianfeng David},
  title     = {Neural Geometry Image-Based Representations with Optimal Transport ({OT})},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {6676--6686}
}
Multimodal Adversarial Defense for Vision-Language Models by Leveraging One-To-Many Relationships: Futa Waseda,

Antonio Tejero-de-Pablos,

Isao Echizen; [pdf] [supp]
[bibtex]
@InProceedings{Waseda_2026_WACV,
  author    = {Waseda, Futa and Tejero-de-Pablos, Antonio and Echizen, Isao},
  title     = {Multimodal Adversarial Defense for Vision-Language Models by Leveraging One-To-Many Relationships},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {6968--6977}
}
Sketch3R: Rapid and Realistic 3D VR Sketch Creation to Shape Retrieval: Mritunjoy Halder,

Shivam Ashok Shukla,

Lokender Tiwari,

Raghav Mittal,

Brojeshwar Bhowmick; [pdf] [supp]
[bibtex]
@InProceedings{Halder_2026_WACV,
  author    = {Halder, Mritunjoy and Shukla, Shivam Ashok and Tiwari, Lokender and Mittal, Raghav and Bhowmick, Brojeshwar},
  title     = {{Sketch3R}: Rapid and Realistic {3D} {VR} Sketch Creation to Shape Retrieval},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {8680--8689}
}
MapleGrasp: Mask-guided Feature Pooling for Language-driven Efficient Robotic Grasping: Vineet Bhat,

Naman Patel,

Prashanth Krishnamurthy,

Ramesh Karri,

Farshad Khorrami; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Bhat_2026_WACV,
  author    = {Bhat, Vineet and Patel, Naman and Krishnamurthy, Prashanth and Karri, Ramesh and Khorrami, Farshad},
  title     = {{MapleGrasp}: Mask-guided Feature Pooling for Language-driven Efficient Robotic Grasping},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {7554--7564}
}
QUOTA: Quantifying Objects with Text-to-Image Models for Any Domain: Wenfang Sun,

Yingjun Du,

Gaowen Liu,

Yefeng Zheng,

Cees G. M. Snoek; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Sun_2026_WACV,
  author    = {Sun, Wenfang and Du, Yingjun and Liu, Gaowen and Zheng, Yefeng and Snoek, Cees G. M.},
  title     = {{QUOTA}: Quantifying Objects with Text-to-Image Models for Any Domain},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {6381--6390}
}
Chain-of-Look Spatial Reasoning for Dense Surgical Instrument Counting: Rishikesh Bhyri,

Brian R Quaranto,

Junsong Yuan,

Peter C W Kim,

Nan Xi; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Bhyri_2026_WACV,
  author    = {Bhyri, Rishikesh and Quaranto, Brian R and Yuan, Junsong and Kim, Peter C W and Xi, Nan},
  title     = {Chain-of-Look Spatial Reasoning for Dense Surgical Instrument Counting},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {8521--8530}
}
Towards Fine-Grained Adaptation of CLIP via a Self-Trained Alignment Score: Eman Ali,

Sathira Silva,

Chetan Arora,

Muhammad Haris Khan; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Ali_2026_WACV,
  author    = {Ali, Eman and Silva, Sathira and Arora, Chetan and Khan, Muhammad Haris},
  title     = {Towards Fine-Grained Adaptation of {CLIP} via a Self-Trained Alignment Score},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {5875--5885}
}
GFT-GCN: Privacy-Preserving 3D Face Mesh Recognition with Spectral Diffusion: Hichem Felouat,

Hanrui Wang,

Isao Echizen; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Felouat_2026_WACV,
  author    = {Felouat, Hichem and Wang, Hanrui and Echizen, Isao},
  title     = {{GFT-GCN}: Privacy-Preserving {3D} Face Mesh Recognition with Spectral Diffusion},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {6236--6245}
}
Disentangle and Regularize: Sign Language Production with Articulator-Based Disentanglement and Channel-Aware Regularization: Sümeyye Meryem Taşyürek,

Tuğçe Kızıltepe,

Hacer Yalim Keles; [pdf] [supp]
[bibtex]
@InProceedings{Tasyurek_2026_WACV,
  author    = {Ta{\c{s}}y{\"u}rek, S{\"u}meyye Meryem and K{\i}z{\i}ltepe, Tu{\u{g}}{\c{c}}e and Keles, Hacer Yalim},
  title     = {Disentangle and Regularize: Sign Language Production with Articulator-Based Disentanglement and Channel-Aware Regularization},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {8458--8467}
}
MIST: Multilingual Incidental Dataset for Scene Text Detection: Saumya Mundra,

Ajoy Mondal,

C.V. Jawahar; [pdf] [supp]
[bibtex]
@InProceedings{Mundra_2026_WACV,
  author    = {Mundra, Saumya and Mondal, Ajoy and Jawahar, C. V.},
  title     = {{MIST}: Multilingual Incidental Dataset for Scene Text Detection},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {7658--7667}
}
VAST-ReID: A Low-Light Benchmark Dataset for Person Re-Identification with Visual and Attribute-Rich Semantic Tracking: Hammad Khan,

Rakesh Kumar Giri,

Kamalakar Vijay Thakare,

Heeseung Choi,

Hyungjoo Jung,

Debi Prosad Dogra,

Ig-Jae Kim; [pdf] [supp]
[bibtex]
@InProceedings{Khan_2026_WACV,
  author    = {Khan, Hammad and Giri, Rakesh Kumar and Thakare, Kamalakar Vijay and Choi, Heeseung and Jung, Hyungjoo and Dogra, Debi Prosad and Kim, Ig-Jae},
  title     = {{VAST-ReID}: A Low-Light Benchmark Dataset for Person Re-Identification with Visual and Attribute-Rich Semantic Tracking},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {5833--5841}
}
Robust Scene Coordinate Regression via Geometrically-Consistent Global Descriptors: Son Tung Nguyen,

Alejandro Fontan,

Michael Milford,

Tobias Fischer; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Nguyen_2026_WACV,
  author    = {Nguyen, Son Tung and Fontan, Alejandro and Milford, Michael and Fischer, Tobias},
  title     = {Robust Scene Coordinate Regression via Geometrically-Consistent Global Descriptors},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {8209--8219}
}
PointSt3R: Point Tracking through 3D Ground Correspondence: Rhodri Guerrier,

Adam W. Harley,

Dima Damen; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Guerrier_2026_WACV,
  author    = {Guerrier, Rhodri and Harley, Adam W. and Damen, Dima},
  title     = {{PointSt3R}: Point Tracking through {3D} Ground Correspondence},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {7430--7439}
}
NoHumansRequired: Autonomous High-Quality Image Editing Triplet Mining: Maksim Kuprashevich,

Grigorii Alekseenko,

Irina Tolstykh,

Georgii Fedorov,

Bulat Suleimanov,

Vladimir Dokholyan,

Aleksandr Gordeev; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Kuprashevich_2026_WACV,
  author    = {Kuprashevich, Maksim and Alekseenko, Grigorii and Tolstykh, Irina and Fedorov, Georgii and Suleimanov, Bulat and Dokholyan, Vladimir and Gordeev, Aleksandr},
  title     = {{NoHumansRequired}: Autonomous High-Quality Image Editing Triplet Mining},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {6059--6068}
}
DuPLUS: Dual-Prompt Vision-Language Model for Universal Medical Image Segmentation and Prognosis: Numan Saeed,

Tausifa Jan Saleem,

Fadillah Maani,

Muhammad Ridzuan,

Hu Wang,

Mohammad Yaqub; [pdf] [supp]
[bibtex]
@InProceedings{Saeed_2026_WACV,
  author    = {Saeed, Numan and Saleem, Tausifa Jan and Maani, Fadillah and Ridzuan, Muhammad and Wang, Hu and Yaqub, Mohammad},
  title     = {{DuPLUS}: Dual-Prompt Vision-Language Model for Universal Medical Image Segmentation and Prognosis},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {8386--8395}
}
Relevance-aware Multi-context Contrastive Decoding for Retrieval-augmented Visual Question Answering: Jongha Kim,

Byungoh Ko,

Jeehye Na,

Jinsung Yoon,

Hyunwoo J. Kim; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Kim_2026_WACV,
  author    = {Kim, Jongha and Ko, Byungoh and Na, Jeehye and Yoon, Jinsung and Kim, Hyunwoo J.},
  title     = {Relevance-aware Multi-context Contrastive Decoding for Retrieval-augmented Visual Question Answering},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {8596--8605}
}
Image-Guided Semantic Pseudo-LiDAR Point Generation for 3D Object Detection: Minseung Lee,

Seokha Moon,

Seung Joon Lee,

Reza Mahjourian,

Jinkyu Kim; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Lee_2026_WACV,
  author    = {Lee, Minseung and Moon, Seokha and Lee, Seung Joon and Mahjourian, Reza and Kim, Jinkyu},
  title     = {Image-Guided Semantic {Pseudo-LiDAR} Point Generation for {3D} Object Detection},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {7137--7147}
}
Intraoperative 2D/3D Registration via Spherical Similarity Learning and Differentiable Levenberg-Marquardt Optimization: Minheng Chen,

Youyong Kong; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Chen_2026_WACV,
  author    = {Chen, Minheng and Kong, Youyong},
  title     = {Intraoperative {2D/3D} Registration via Spherical Similarity Learning and Differentiable {Levenberg-Marquardt} Optimization},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {7239--7249}
}
Bridging the Domain Gap in Small Multimodal Models: A Dual-level Alignment Perspective: Aveen Dayal,

Peketi Divya,

Nidhi Tiwari,

Linga Reddy Cenkeramaddi,

C Krishna Mohan,

Abhinav Kumar; [pdf] [supp]
[bibtex]
@InProceedings{Dayal_2026_WACV,
  author    = {Dayal, Aveen and Divya, Peketi and Tiwari, Nidhi and Cenkeramaddi, Linga Reddy and Mohan, C Krishna and Kumar, Abhinav},
  title     = {Bridging the Domain Gap in Small Multimodal Models: A Dual-level Alignment Perspective},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {8262--8271}
}
ChartQA-X: Generating Explanations for Visual Chart Reasoning: Shamanthak Hegde,

Pooyan Fazli,

Hasti Seifi; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Hegde_2026_WACV,
  author    = {Hegde, Shamanthak and Fazli, Pooyan and Seifi, Hasti},
  title     = {{ChartQA-X}: Generating Explanations for Visual Chart Reasoning},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {6453--6463}
}
RealDroneVision: Dataset and Architecture Advancements for Small-Object Drone Detection: Arun Kumar Sivapuram,

Pranav R T Peddinti,

Harish Puppala,

Komuravelli Prashanth,

Jaladi Sri Harsha,

Rama Krishna Sai Gorthi; [pdf] [supp]
[bibtex]
@InProceedings{Sivapuram_2026_WACV,
  author    = {Sivapuram, Arun Kumar and Peddinti, Pranav R T and Puppala, Harish and Prashanth, Komuravelli and Harsha, Jaladi Sri and Gorthi, Rama Krishna Sai},
  title     = {{RealDroneVision}: Dataset and Architecture Advancements for Small-Object Drone Detection},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {6687--6695}
}
brat: Aligned Multi-View Embeddings for Brain MRI Analysis: Maxime Kayser,

Maksim Gridnev,

Wanting Wang,

Max Bain,

Aneesh Rangnekar,

Avijit Chatterjee,

Aleksandr Petrov,

Harini Veeraraghavan,

Nathaniel C. Swinburne; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Kayser_2026_WACV,
  author    = {Kayser, Maxime and Gridnev, Maksim and Wang, Wanting and Bain, Max and Rangnekar, Aneesh and Chatterjee, Avijit and Petrov, Aleksandr and Veeraraghavan, Harini and Swinburne, Nathaniel C.},
  title     = {{brat}: Aligned Multi-View Embeddings for Brain {MRI} Analysis},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {5864--5874}
}
Histogram Assisted Quality Aware Generative Model for Resolution Invariant NIR Image Colorization: Abhinav Attri,

Rajeev Ranjan Dwivedi,

Samiran Das,

Vinod Kumar Kurmi; [pdf] [arXiv]
[bibtex]
@InProceedings{Attri_2026_WACV,
  author    = {Attri, Abhinav and Dwivedi, Rajeev Ranjan and Das, Samiran and Kurmi, Vinod Kumar},
  title     = {Histogram Assisted Quality Aware Generative Model for Resolution Invariant {NIR} Image Colorization},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {6422--6431}
}
Fetal and Neonatal Cortical Surface Reconstruction with Anatomical Normal-guidance and Perceptual Enhancements: Jiyang Lee,

Woori Bae,

U-Geun Ji,

Hanyeol Yang,

Jong-Min Lee; [pdf]
[bibtex]
@InProceedings{Lee_2026_WACV,
  author    = {Lee, Jiyang and Bae, Woori and Ji, U-Geun and Yang, Hanyeol and Lee, Jong-Min},
  title     = {Fetal and Neonatal Cortical Surface Reconstruction with Anatomical Normal-guidance and Perceptual Enhancements},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {7759--7768}
}
TriaGS: Differentiable Triangulation-Guided Geometric Consistency for 3D Gaussian Splatting: Quan Tran,

Tuan Dang; [pdf] [arXiv]
[bibtex]
@InProceedings{Tran_2026_WACV,
  author    = {Tran, Quan and Dang, Tuan},
  title     = {{TriaGS}: Differentiable Triangulation-Guided Geometric Consistency for {3D} {Gaussian} Splatting},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {8396--8405}
}
PALMS+: Modular Image-Based Floor Plan Localization Leveraging Depth Foundation Model: Yunqian Cheng,

Benjamin Princen,

Roberto Manduchi; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Cheng_2026_WACV,
  author    = {Cheng, Yunqian and Princen, Benjamin and Manduchi, Roberto},
  title     = {{PALMS+}: Modular Image-Based Floor Plan Localization Leveraging Depth Foundation Model},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {7084--7093}
}
Advancing Player Identification and Tracking with Global ID Fusion (GIF): Karol Wojtulewicz,

Minxing Liu,

Niklas Carlsson; [pdf] [supp]
[bibtex]
@InProceedings{Wojtulewicz_2026_WACV,
  author    = {Wojtulewicz, Karol and Liu, Minxing and Carlsson, Niklas},
  title     = {Advancing Player Identification and Tracking with Global {ID} Fusion ({GIF})},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {7269--7280}
}
VRAgent: Self-Refining Agent for Zero-Shot Multimodal Video Retrieval: Ketul Shah,

Pankaj Nathani,

Rama Chellappa,

Fabian Caba Heilbron; [pdf] [supp]
[bibtex]
@InProceedings{Shah_2026_WACV,
  author    = {Shah, Ketul and Nathani, Pankaj and Chellappa, Rama and Caba Heilbron, Fabian},
  title     = {{VRAgent}: Self-Refining Agent for Zero-Shot Multimodal Video Retrieval},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {8157--8167}
}
Alignment and Distillation: A Robust Framework for Multimodal Domain Generalizable Human Action Recognition: Hyeonbin Ji,

Juyeob Lee,

Eunil Park; [pdf]
[bibtex]
@InProceedings{Ji_2026_WACV,
  author    = {Ji, Hyeonbin and Lee, Juyeob and Park, Eunil},
  title     = {Alignment and Distillation: A Robust Framework for Multimodal Domain Generalizable Human Action Recognition},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {6913--6924}
}
Correcting and Quantifying Systematic Errors in 3D Box Annotations for Autonomous Driving: Alexandre Justo Miro,

Ludvig af Klinteberg,

Bogdan Timus,

Aron Asefaw,

Ajinkya Khoche,

Thomas Gustafsson,

Sina Sharif Mansouri,

Masoud Daneshtalab; [pdf] [arXiv]
[bibtex]
@InProceedings{Miro_2026_WACV,
  author    = {Miro, Alexandre Justo and af Klinteberg, Ludvig and Timus, Bogdan and Asefaw, Aron and Khoche, Ajinkya and Gustafsson, Thomas and Mansouri, Sina Sharif and Daneshtalab, Masoud},
  title     = {Correcting and Quantifying Systematic Errors in {3D} Box Annotations for Autonomous Driving},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {6724--6732}
}
CaFlow: Enhancing Long-Term Action Quality Assessment with Causal Counterfactual Flow: Ruisheng Han,

Kanglei Zhou,

Shuang Chen,

Amir Atapour-Abarghouei,

Hubert P. H. Shum; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Han_2026_WACV,
  author    = {Han, Ruisheng and Zhou, Kanglei and Chen, Shuang and Atapour-Abarghouei, Amir and Shum, Hubert P. H.},
  title     = {{CaFlow}: Enhancing Long-Term Action Quality Assessment with Causal Counterfactual Flow},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {8231--8241}
}
Learning Beyond Labels: Self-Supervised Handwritten Text Recognition: Shree Mitra,

Ajoy Mondal,

C.V. Jawahar; [pdf] [supp]
[bibtex]
@InProceedings{Mitra_2026_WACV,
  author    = {Mitra, Shree and Mondal, Ajoy and Jawahar, C. V.},
  title     = {Learning Beyond Labels: Self-Supervised Handwritten Text Recognition},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {6653--6663}
}
KMOPS: Keypoint-Driven Method for Multi-Object Pose and Metric Size Estimation from Stereo Images: Ying-Kun Wu,

Yi Shen,

Tzuhsuan Huang,

I-Sheng Fang,

Jun-Cheng Chen; [pdf] [supp]
[bibtex]
@InProceedings{Wu_2026_WACV,
  author    = {Wu, Ying-Kun and Shen, Yi and Huang, Tzuhsuan and Fang, I-Sheng and Chen, Jun-Cheng},
  title     = {{KMOPS}: Keypoint-Driven Method for Multi-Object Pose and Metric Size Estimation from Stereo Images},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {7730--7739}
}
Isolating the Role of Temporal Information in Video Saliency: A Controlled Experimental Analysis: Peter El-Jiz,

Matthias Kuemmerer,

Matthias Tangemann,

Matthias Bethge,

Andreas Bartels,

Michael Mario Bannert; [pdf] [supp]
[bibtex]
@InProceedings{El-Jiz_2026_WACV,
  author    = {El-Jiz, Peter and Kuemmerer, Matthias and Tangemann, Matthias and Bethge, Matthias and Bartels, Andreas and Bannert, Michael Mario},
  title     = {Isolating the Role of Temporal Information in Video Saliency: A Controlled Experimental Analysis},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {5909--5918}
}
ScoreNet: Netting Lightweight Quality Scores for Better Visual Assessment with Large Multi-Modality Models: Bahador Rashidi,

Kiarash Aghakasiri,

Shupei Zhang,

Amirmohsen Sattarifard,

Yue Zhang,

Chao Gao; [pdf] [supp]
[bibtex]
@InProceedings{Rashidi_2026_WACV,
  author    = {Rashidi, Bahador and Aghakasiri, Kiarash and Zhang, Shupei and Sattarifard, Amirmohsen and Zhang, Yue and Gao, Chao},
  title     = {{ScoreNet}: Netting Lightweight Quality Scores for Better Visual Assessment with Large Multi-Modality Models},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {7008--7018}
}
Digital Forensic AI You Can Explain: A Case Study on Video Source Camera Identification: Maryna Veksler,

Kemal Akkaya,

Selcuk Uluagac; [pdf]
[bibtex]
@InProceedings{Veksler_2026_WACV,
  author    = {Veksler, Maryna and Akkaya, Kemal and Uluagac, Selcuk},
  title     = {Digital Forensic {AI} You Can Explain: A Case Study on Video Source Camera Identification},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {7030--7039}
}
CoreCaption: Core Caption based Text-to-Video Retrieval: Junkyu Jang; [pdf] [supp]
[bibtex]
@InProceedings{Jang_2026_WACV,
  author    = {Jang, Junkyu},
  title     = {{CoreCaption}: Core Caption based Text-to-Video Retrieval},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {6600--6610}
}
Semantic Map Guided Bird's-Eye View Learning for Online HD Map Construction: Huantao Ren,

Hesham M. Eraqi,

ABM Musa,

Mohamed Moustafa; [pdf]
[bibtex]
@InProceedings{Ren_2026_WACV,
  author    = {Ren, Huantao and Eraqi, Hesham M. and Musa, ABM and Moustafa, Mohamed},
  title     = {Semantic Map Guided Bird's-Eye View Learning for Online {HD} Map Construction},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {7852--7861}
}
Enhancing Monocular 3D Hand Reconstruction with Learned Texture Priors: Giorgos Karvounas,

Nikolaos Kyriazis,

Iason Oikonomidis,

Georgios Pavlakos,

Antonis A. Argyros; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Karvounas_2026_WACV,
  author    = {Karvounas, Giorgos and Kyriazis, Nikolaos and Oikonomidis, Iason and Pavlakos, Georgios and Argyros, Antonis A.},
  title     = {Enhancing Monocular {3D} Hand Reconstruction with Learned Texture Priors},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {7073--7083}
}
ACuRE: Accurate Continuity-Regularized SpO2 Estimation Using Liquid Time-Constant Networks: Shahzad Ahmad,

Divya Mishra,

Sania Bano,

Sukalpa Chanda,

Yogesh Singh Rawat; [pdf] [supp]
[bibtex]
@InProceedings{Ahmad_2026_WACV,
  author    = {Ahmad, Shahzad and Mishra, Divya and Bano, Sania and Chanda, Sukalpa and Rawat, Yogesh Singh},
  title     = {{ACuRE}: Accurate Continuity-Regularized {SpO2} Estimation Using Liquid Time-Constant Networks},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {7250--7259}
}
SceneShine: Illumination-aware Human Scene Gaussian Re-Splatting from Mobile Device Video: Xuqian Ren,

Wenjia Wang,

Mai Ngoc Nguyen,

Juho Kannala,

Esa Rahtu; [pdf] [supp]
[bibtex]
@InProceedings{Ren_2026_WACV,
  author    = {Ren, Xuqian and Wang, Wenjia and Nguyen, Mai Ngoc and Kannala, Juho and Rahtu, Esa},
  title     = {{SceneShine}: Illumination-aware Human Scene {Gaussian} Re-Splatting from Mobile Device Video},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {8302--8312}
}
T2VWorldBench: A Benchmark for Evaluating World Knowledge in Text-to-Video Generation: Yubin Chen,

Xuyang Guo,

Zhenmei Shi,

Zhao Song,

Jiahao Zhang; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Chen_2026_WACV,
  author    = {Chen, Yubin and Guo, Xuyang and Shi, Zhenmei and Song, Zhao and Zhang, Jiahao},
  title     = {{T2VWorldBench}: A Benchmark for Evaluating World Knowledge in Text-to-Video Generation},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  month     = mar,
  year      = {2026},
  pages     = {6474--6485}
}; Back