Papers
Generative Self-Supervised Learning for Medical Image Classification-
[pdf]
[supp]
[bibtex]@InProceedings{Park_2024_ACCV,
  author = {Park, Inhyuk and Kim, Sungeun and Ryu, Jongbin},
  title = {Generative Self-Supervised Learning for Medical Image Classification},
  booktitle = {Proceedings of the Asian Conference on Computer Vision ({ACCV})},
  month = dec,
  year = {2024},
  pages = {976--993}
}
Depth Attention for Robust RGB Tracking-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liu_2024_ACCV,
  author = {Liu, Yu and Mahmood, Arif and Khan, Muhammad Haris},
  title = {Depth Attention for Robust {RGB} Tracking},
  booktitle = {Proceedings of the Asian Conference on Computer Vision ({ACCV})},
  month = dec,
  year = {2024},
  pages = {213--231}
}
MedBLIP: Bootstrapping Language-Image Pre-training from 3D Medical Images and Texts-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chen_2024_ACCV,
  author = {Chen, Qiuhui and Hong, Yi},
  title = {{MedBLIP}: Bootstrapping Language-Image Pre-training from {3D} Medical Images and Texts},
  booktitle = {Proceedings of the Asian Conference on Computer Vision ({ACCV})},
  month = dec,
  year = {2024},
  pages = {2404--2420}
}
Neural Active Structure-from-Motion in Dark and Textureless Environment-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ichimaru_2024_ACCV,
  author = {Ichimaru, Kazuto and Thomas, Diego and Iwaguchi, Takafumi and Kawasaki, Hiroshi},
  title = {Neural Active Structure-from-Motion in Dark and Textureless Environment},
  booktitle = {Proceedings of the Asian Conference on Computer Vision ({ACCV})},
  month = dec,
  year = {2024},
  pages = {2145--2161}
}
LoGDesc: Local geometric features aggregation for robust point cloud registration-
[pdf]
[arXiv]
[bibtex]@InProceedings{Slimani_2024_ACCV,
  author = {Slimani, Karim and Tamadazte, Brahim and Achard, Catherine},
  title = {{LoGDesc}: Local geometric features aggregation for robust point cloud registration},
  booktitle = {Proceedings of the Asian Conference on Computer Vision ({ACCV})},
  month = dec,
  year = {2024},
  pages = {1952--1968}
}
OmniFusion: Exemplar-based Video Colorization Using OmniMotion and Diffusion Priors-
[pdf]
[bibtex]@InProceedings{Fang_2024_ACCV,
  author = {Fang, Xiaoyuan and Dai, Longquan and Tang, Jinhui},
  title = {{OmniFusion}: Exemplar-based Video Colorization Using {OmniMotion} and Diffusion Priors},
  booktitle = {Proceedings of the Asian Conference on Computer Vision ({ACCV})},
  month = dec,
  year = {2024},
  pages = {1215--1232}
}
Contrastive Learning using Synthetic Images Generated from Real Images-
[pdf]
[bibtex]@InProceedings{Sasaya_2024_ACCV,
  author = {Sasaya, Tenta and Yamamoto, Shintaro and Ida, Takashi and Takimoto, Takahiro},
  title = {Contrastive Learning using Synthetic Images Generated from Real Images},
  booktitle = {Proceedings of the Asian Conference on Computer Vision ({ACCV})},
  month = dec,
  year = {2024},
  pages = {887--903}
}
iS-MAP: Neural Implicit Mapping and Positioning for Structural Environments-
[pdf]
[supp]
[bibtex]@InProceedings{Wang_2024_ACCV,
  author = {Wang, Haocheng and Cao, Yanlong and Shou, Yejun and Shen, Lingfeng and Wei, Xiaoyao and Xu, Zhijie and Ren, Kai},
  title = {{iS-MAP}: Neural Implicit Mapping and Positioning for Structural Environments},
  booktitle = {Proceedings of the Asian Conference on Computer Vision ({ACCV})},
  month = dec,
  year = {2024},
  pages = {747--763}
}
A Universal Structure of YOLO Series Small Object Detection Models-
[pdf]
[bibtex]@InProceedings{Hu_2024_ACCV,
  author = {Hu, Shengchao and Liu, Xiao and Wang, Weijun and Huang, Tianlun and Feng, Wei},
  title = {A Universal Structure of {YOLO} Series Small Object Detection Models},
  booktitle = {Proceedings of the Asian Conference on Computer Vision ({ACCV})},
  month = dec,
  year = {2024},
  pages = {3706--3722}
}
Decoupled DETR For Few-shot Object Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Shangguan_2024_ACCV,
  author = {Shangguan, Zeyu and Huai, Lian and Liu, Tong and Liu, Yuyu and Jiang, Xingqun},
  title = {Decoupled {DETR} For Few-shot Object Detection},
  booktitle = {Proceedings of the Asian Conference on Computer Vision ({ACCV})},
  month = dec,
  year = {2024},
  pages = {286--302}
}
GaitW: Enhancing Gait Recognition in the Wild using Dynamic Information-
[pdf]
[supp]
[bibtex]@InProceedings{Thapar_2024_ACCV,
  author = {Thapar, Daksh and Chaudhari, Jayesh and Manchanda, Sunny and Nigam, Aditya and Arora, Chetan},
  title = {{GaitW}: Enhancing Gait Recognition in the Wild using Dynamic Information},
  booktitle = {Proceedings of the Asian Conference on Computer Vision ({ACCV})},
  month = dec,
  year = {2024},
  pages = {268--285}
}
ELLAR: An Action Recognition Dataset for Extremely Low-Light Conditions with Dual Gamma Adaptive Modulation-
[pdf]
[supp]
[bibtex]@InProceedings{Ha_2024_ACCV,
  author = {Ha, Minse and Bae, Wan-Gi and Bae, Geunyoung and Lee, Jong Taek},
  title = {{ELLAR}: An Action Recognition Dataset for Extremely Low-Light Conditions with Dual Gamma Adaptive Modulation},
  booktitle = {Proceedings of the Asian Conference on Computer Vision ({ACCV})},
  month = dec,
  year = {2024},
  pages = {800--817}
}
EmoTalker: Audio Driven Emotion Aware Talking Head Generation-
[pdf]
[supp]
[bibtex]@InProceedings{Shen_2024_ACCV,
  author = {Shen, Xiaoqian and Khan, Faizan Farooq and Elhoseiny, Mohamed},
  title = {{EmoTalker}: Audio Driven Emotion Aware Talking Head Generation},
  booktitle = {Proceedings of the Asian Conference on Computer Vision ({ACCV})},
  month = dec,
  year = {2024},
  pages = {1900--1917}
}
Bringing Masked Autoencoders Explicit Contrastive Properties for Point Cloud Self-Supervised Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ren_2024_ACCV,
  author = {Ren, Bin and Mei, Guofeng and Paudel, Danda Pani and Wang, Weijie and Li, Yawei and Liu, Mengyuan and Cucchiara, Rita and Van Gool, Luc and Sebe, Nicu},
  title = {Bringing Masked Autoencoders Explicit Contrastive Properties for Point Cloud Self-Supervised Learning},
  booktitle = {Proceedings of the Asian Conference on Computer Vision ({ACCV})},
  month = dec,
  year = {2024},
  pages = {2034--2052}
}
Dense Trajectory Fields: Consistent and Efficient Spatio-Temporal Pixel Tracking-
[pdf]
[bibtex]@InProceedings{Tournadre_2024_ACCV,
  author = {Tournadre, Marc and Soladi{\'e}, Catherine and Stoiber, Nicolas and Richard, Pierre-Yves},
  title = {Dense Trajectory Fields: Consistent and Efficient Spatio-Temporal Pixel Tracking},
  booktitle = {Proceedings of the Asian Conference on Computer Vision ({ACCV})},
  month = dec,
  year = {2024},
  pages = {2212--2230}
}
Dual Memory Networks Guided Reverse Distillation for Unsupervised Anomaly Detection-
[pdf]
[supp]
[bibtex]@InProceedings{Tran_2024_ACCV,
  author = {Tran, Chi Dai and Pham, Long Hoang and Tran, Duong Nguyen-Ngoc and Ho, Quoc Pham-Nam and Jeon, Jae Wook},
  title = {Dual Memory Networks Guided Reverse Distillation for Unsupervised Anomaly Detection},
  booktitle = {Proceedings of the Asian Conference on Computer Vision ({ACCV})},
  month = dec,
  year = {2024},
  pages = {2650--2666}
}
BiEfficient: Bidirectionally Prompting Vision-Language Models for Parameter-Efficient Video Recognition-
[pdf]
[bibtex]@InProceedings{He_2024_ACCV,
  author = {He, Haichen and Liu, Weibin and Xing, Weiwei},
  title = {{BiEfficient}: Bidirectionally Prompting Vision-Language Models for Parameter-Efficient Video Recognition},
  booktitle = {Proceedings of the Asian Conference on Computer Vision ({ACCV})},
  month = dec,
  year = {2024},
  pages = {108--125}
}
Event-based Image Enhancement Under High Dynamic Range Scenarios-
[pdf]
[bibtex]@InProceedings{Weng_2024_ACCV,
  author = {Weng, Jingchong and Li, Boyang and Huang, Kai},
  title = {Event-based Image Enhancement Under High Dynamic Range Scenarios},
  booktitle = {Proceedings of the Asian Conference on Computer Vision ({ACCV})},
  month = dec,
  year = {2024},
  pages = {2456--2470}
}
PARNet: Aortic Reconstruction from Orthogonal X-rays Using Pre-Trained Generative Adversarial Networks-
[pdf]
[supp]
[bibtex]@InProceedings{Cao_2024_ACCV,
  author = {Cao, Chengwei and Zhang, Jinhui and Gao, Yueyang and Li, Zheng},
  title = {{PARNet}: Aortic Reconstruction from Orthogonal {X-rays} Using Pre-Trained Generative Adversarial Networks},
  booktitle = {Proceedings of the Asian Conference on Computer Vision ({ACCV})},
  month = dec,
  year = {2024},
  pages = {852--869}
}
Multi-path Segmentation Network Based on CNN and Transformer for Skin Lesion Image-
[pdf]
[bibtex]@InProceedings{Nie_2024_ACCV,
  author = {Nie, Tianyu and Zhao, Yishi and Yao, Shihong},
  title = {Multi-path Segmentation Network Based on {CNN} and Transformer for Skin Lesion Image},
  booktitle = {Proceedings of the Asian Conference on Computer Vision ({ACCV})},
  month = dec,
  year = {2024},
  pages = {3137--3153}
}
Hi-NeRF: Hybridizing 2D Inpainting with Neural Radiance Fields for 3D Scene Inpainting-
[pdf]
[supp]
[bibtex]@InProceedings{Huang_2024_ACCV,
  author = {Huang, Xianliang and Chen, Shuhang and Zhong, Zhizhou and Gou, Jiajie and Guan, Jihong and Zhou, Shuigeng},
  title = {{Hi-NeRF}: Hybridizing {2D} Inpainting with Neural Radiance Fields for {3D} Scene Inpainting},
  booktitle = {Proceedings of the Asian Conference on Computer Vision ({ACCV})},
  month = dec,
  year = {2024},
  pages = {2855--2871}
}
Adaptive Bias Discovery for Learning Debiased Classifier-
[pdf]
[supp]
[bibtex]@InProceedings{Bae_2024_ACCV,
  author = {Bae, Jun-Hyun and Lee, Minho and Jung, Heechul},
  title = {Adaptive Bias Discovery for Learning Debiased Classifier},
  booktitle = {Proceedings of the Asian Conference on Computer Vision ({ACCV})},
  month = dec,
  year = {2024},
  pages = {3074--3090}
}
FocusNet: Cascaded Lightweight Networks and Ascending Feature Enhancement for Efficient Salient Object Detection-
[pdf]
[bibtex]@InProceedings{Zhou_2024_ACCV,
  author = {Zhou, Chiheng and Zhou, Yongxia and Pan, Chen},
  title = {{FocusNet}: Cascaded Lightweight Networks and Ascending Feature Enhancement for Efficient Salient Object Detection},
  booktitle = {Proceedings of the Asian Conference on Computer Vision ({ACCV})},
  month = dec,
  year = {2024},
  pages = {2388--2403}
}
InstantGeoAvatar: Effective Geometry and Appearance Modeling of Animatable Avatars from Monocular Video-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Budria_2024_ACCV,
  author = {Budria, Alvaro and Lopez-Rodriguez, Adrian and Lorente, {\`O}scar and Moreno-Noguer, Francesc},
  title = {{InstantGeoAvatar}: Effective Geometry and Appearance Modeling of Animatable Avatars from Monocular Video},
  booktitle = {Proceedings of the Asian Conference on Computer Vision ({ACCV})},
  month = dec,
  year = {2024},
  pages = {1827--1848}
}
Neural Substitution for Branch-level Network Re-parameterization-
[pdf]
[supp]
[bibtex]@InProceedings{Oh_2024_ACCV,
  author = {Oh, Seungmin and Ryu, Jongbin},
  title = {Neural Substitution for Branch-level Network Re-parameterization},
  booktitle = {Proceedings of the Asian Conference on Computer Vision ({ACCV})},
  month = dec,
  year = {2024},
  pages = {959--975}
}
ATTIQA: Generalizable Image Quality Feature Extractor using Attribute-aware Pretraining-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kwon_2024_ACCV,
  author = {Kwon, Daekyu and Kim, Dongyoung and Ki, Sehwan and Jo, Younghyun and Lee, Hyong-Euk and Kim, Seon Joo},
  title = {{ATTIQA}: Generalizable Image Quality Feature Extractor using Attribute-aware Pretraining},
  booktitle = {Proceedings of the Asian Conference on Computer Vision ({ACCV})},
  month = dec,
  year = {2024},
  pages = {4526--4543}
}
Seeing Through Expert's Eyes: Leveraging Radiologist Eye Gaze and Speech Report with Graph Neural Networks for Chest X-ray Image Classification-
[pdf]
[bibtex]@InProceedings{Sultana_2024_ACCV,
  author = {Sultana, Jamalia and Qin, Ruwen and Yin, Zhaozheng},
  title = {Seeing Through Expert's Eyes: Leveraging Radiologist Eye Gaze and Speech Report with Graph Neural Networks for Chest {X-ray} Image Classification},
  booktitle = {Proceedings of the Asian Conference on Computer Vision ({ACCV})},
  month = dec,
  year = {2024},
  pages = {2579--2595}
}
Instance-Dependent Noise Refinement in Segment Anything Model for Weakly Supervised Object Detection-
[pdf]
[bibtex]@InProceedings{Taherkhani_2024_ACCV,
  author = {Taherkhani, Fariborz and Kazemi, Ehsan},
  title = {Instance-Dependent Noise Refinement in {Segment Anything Model} for Weakly Supervised Object Detection},
  booktitle = {Proceedings of the Asian Conference on Computer Vision ({ACCV})},
  month = dec,
  year = {2024},
  pages = {4505--4525}
}
HARD : Hardware-Aware lightweight Real-time semantic segmentation model Deployable from Edge to GPU-
[pdf]
[supp]
[bibtex]@InProceedings{Kwon_2024_ACCV,
  author = {Kwon, YoungWook and Kim, WanSoo and Kim, HyunJin},
  title = {{HARD} : Hardware-Aware lightweight Real-time semantic segmentation model Deployable from Edge to {GPU}},
  booktitle = {Proceedings of the Asian Conference on Computer Vision ({ACCV})},
  month = dec,
  year = {2024},
  pages = {3552--3569}
}
TAPS: Temporal Attention-based Pruning and Scaling for Efficient Video Action Recognition-
[pdf]
[bibtex]@InProceedings{Dinai_2024_ACCV,
  author = {Dinai, Yonatan and Raviv, Avraham and Harel, Nimrod and Kim, Donghoon and Goldin, Ishay and Zehngut, Niv},
  title = {{TAPS}: Temporal Attention-based Pruning and Scaling for Efficient Video Action Recognition},
  booktitle = {Proceedings of the Asian Conference on Computer Vision ({ACCV})},
  month = dec,
  year = {2024},
  pages = {3803--3818}
}
Vision language models are blind-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Rahmanzadehgervi_2024_ACCV,
  author = {Rahmanzadehgervi, Pooyan and Bolton, Logan and Taesiri, Mohammad Reza and Nguyen, Anh Totti},
  title = {Vision language models are blind},
  booktitle = {Proceedings of the Asian Conference on Computer Vision ({ACCV})},
  month = dec,
  year = {2024},
  pages = {18--34}
}
Bridging the Projection Gap: Overcoming Projection Bias Through Parameterized Distance Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhang_2024_ACCV,
  author = {Zhang, Chong and Jin, Mingyu and Yu, Qinkai and Xue, Haochen and Gowda, Shreyank N and Jin, Xiaobo},
  title = {Bridging the Projection Gap: Overcoming Projection Bias Through Parameterized Distance Learning},
  booktitle = {Proceedings of the Asian Conference on Computer Vision ({ACCV})},
  month = dec,
  year = {2024},
  pages = {3327--3343}
}
RD-Diff: RLTransformer-based Diffusion Model with Diversity-Inducing Modulator for Human Motion Prediction-
[pdf]
[supp]
[bibtex]@InProceedings{Zhang_2024_ACCV,
  author = {Zhang, Haosong and Leong, Mei Chee and Li, Liyuan and Lin, Weisi},
  title = {{RD-Diff}: {RLTransformer}-based Diffusion Model with Diversity-Inducing Modulator for Human Motion Prediction},
  booktitle = {Proceedings of the Asian Conference on Computer Vision ({ACCV})},
  month = dec,
  year = {2024},
  pages = {3531--3551}
}
CCNDF: Curvature Constrained Neural Distance Fields from 3D LiDAR Sequences-
[pdf]
[bibtex]@InProceedings{Singh_2024_ACCV,
  author = {Singh, Akshit and Bhakuni, Karan and Nagar, Rajendra},
  title = {{CCNDF}: Curvature Constrained Neural Distance Fields from {3D} {LiDAR} Sequences},
  booktitle = {Proceedings of the Asian Conference on Computer Vision ({ACCV})},
  month = dec,
  year = {2024},
  pages = {682--698}
}
Every Shot Counts: Using Exemplars for Repetition Counting in Videos-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Sinha_2024_ACCV,
  author = {Sinha, Saptarshi and Stergiou, Alexandros and Damen, Dima},
  title = {Every Shot Counts: Using Exemplars for Repetition Counting in Videos},
  booktitle = {Proceedings of the Asian Conference on Computer Vision ({ACCV})},
  month = dec,
  year = {2024},
  pages = {3056--3073}
}
Co-Segmentation without any Pixel-level Supervision with Application to Large-Scale Sketch Classification-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ypsilantis_2024_ACCV,
  author = {Ypsilantis, Nikolaos-Antonios and Chum, Ond{\v{r}}ej},
  title = {Co-Segmentation without any Pixel-level Supervision with Application to Large-Scale Sketch Classification},
  booktitle = {Proceedings of the Asian Conference on Computer Vision ({ACCV})},
  month = dec,
  year = {2024},
  pages = {1849--1865}
}
EffiSeaNet: Pioneering Lightweight Network for Underwater Salient Object Detection-
[pdf]
[bibtex]@InProceedings{Wu_2024_ACCV,
  author = {Wu, Qingyao and Fu, Zhenqi and Lin, Hong and Ma, Chenyu and Tu, Xiaotong and Ding, Xinghao},
  title = {{EffiSeaNet}: Pioneering Lightweight Network for Underwater Salient Object Detection},
  booktitle = {Proceedings of the Asian Conference on Computer Vision ({ACCV})},
  month = dec,
  year = {2024},
  pages = {1486--1501}
}
Enhanced Super-Resolution Training via Mimicked Alignment for Real-World Scenes-
[pdf]
[arXiv]
[bibtex]@InProceedings{Elezabi_2024_ACCV,
  author = {Elezabi, Omar and Wu, Zongwei and Timofte, Radu},
  title = {Enhanced Super-Resolution Training via Mimicked Alignment for Real-World Scenes},
  booktitle = {Proceedings of the Asian Conference on Computer Vision ({ACCV})},
  month = dec,
  year = {2024},
  pages = {4122--4140}
}
RayEmb: Arbitrary Landmark Detection in X-Ray Images Using Ray Embedding Subspace-
[pdf]
[supp]
[bibtex]@InProceedings{Shrestha_2024_ACCV,
  author = {Shrestha, Pragyan and Xie, Chun and Yoshii, Yuichi and Kitahara, Itaru},
  title = {{RayEmb}: Arbitrary Landmark Detection in {X-Ray} Images Using Ray Embedding Subspace},
  booktitle = {Proceedings of the Asian Conference on Computer Vision ({ACCV})},
  month = dec,
  year = {2024},
  pages = {665--681}
}
FG-CXR: A Radiologist-Aligned Gaze Dataset for Enhancing Interpretability in Chest X-Ray Report Generation-
[pdf]
[bibtex]@InProceedings{Pham_2024_ACCV,
  author = {Pham, Trong Thang and Ho, Ngoc-Vuong and Bui, Nhat-Tan and Phan, Thinh and Brijesh, Patel and Adjeroh, Donald and Doretto, Gianfranco and Nguyen, Anh and Wu, Carol C. and Nguyen, Hien and Le, Ngan},
  title = {{FG-CXR}: A Radiologist-Aligned Gaze Dataset for Enhancing Interpretability in Chest {X-Ray} Report Generation},
  booktitle = {Proceedings of the Asian Conference on Computer Vision ({ACCV})},
  month = dec,
  year = {2024},
  pages = {941--958}
}
Learning 2D Human Poses for Better 3D Lifting via Multi-Model 3D-Guidance-
[pdf]
[supp]
[bibtex]@InProceedings{Lee_2024_ACCV,
  author = {Lee, Sanghyeon and Hwang, Yoonho and Lee, Jong Taek},
  title = {Learning {2D} Human Poses for Better {3D} Lifting via Multi-Model {3D}-Guidance},
  booktitle = {Proceedings of the Asian Conference on Computer Vision ({ACCV})},
  month = dec,
  year = {2024},
  pages = {3344--3361}
}
Enhancing Photo Animation: Augmented Stylistic Modules and Prior Knowledge Integration-
[pdf]
[supp]
[bibtex]@InProceedings{Lu_2024_ACCV,
  author = {Lu, Zhanyi and Zhou, Yue and Chen, Ao},
  title = {Enhancing Photo Animation: Augmented Stylistic Modules and Prior Knowledge Integration},
  booktitle = {Proceedings of the Asian Conference on Computer Vision ({ACCV})},
  month = dec,
  year = {2024},
  pages = {1470--1485}
}
Sparse Domain Transfer via Elastic Net Regularization-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhang_2024_ACCV,
  author = {Zhang, Jingwei and Farnia, Farzan},
  title = {Sparse Domain Transfer via Elastic Net Regularization},
  booktitle = {Proceedings of the Asian Conference on Computer Vision ({ACCV})},
  month = dec,
  year = {2024},
  pages = {454--470}
}
Redefining Normal: A Novel Object-Level Approach for Multi-Object Novelty Detection-
[pdf]
[supp]
[bibtex]@InProceedings{Salehi_2024_ACCV,
  author = {Salehi, Mohammadreza and Apostolikas, Nikolaos and Gavves, Efstratios and Snoek, Cees G. M. and Asano, Yuki M.},
  title = {Redefining Normal: A Novel Object-Level Approach for Multi-Object Novelty Detection},
  booktitle = {Proceedings of the Asian Conference on Computer Vision ({ACCV})},
  month = dec,
  year = {2024},
  pages = {402--418}
}
TranSPORTmer: A Holistic Approach to Trajectory Understanding in Multi-Agent Sports-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Capellera_2024_ACCV,
  author = {Capellera, Guillem and Ferraz, Luis and Rubio, Antonio and Agudo, Antonio and Moreno-Noguer, Francesc},
  title = {{TranSPORTmer}: A Holistic Approach to Trajectory Understanding in Multi-Agent Sports},
  booktitle = {Proceedings of the Asian Conference on Computer Vision ({ACCV})},
  month = dec,
  year = {2024},
  pages = {1652--1670}
}
Bridging Optimal Transport and Jacobian Regularization by Optimal Trajectory for Enhanced Adversarial Defense-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Le_2024_ACCV,
  author = {Le, Binh M. and Tariq, Shahroz and Woo, Simon S.},
  title = {Bridging Optimal Transport and {Jacobian} Regularization by Optimal Trajectory for Enhanced Adversarial Defense},
  booktitle = {Proceedings of the Asian Conference on Computer Vision ({ACCV})},
  month = dec,
  year = {2024},
  pages = {419--435}
}
Guide3D: A Bi-planar X-ray Dataset for Guidewire Segmentation and 3D Reconstruction-
[pdf]
[bibtex]@InProceedings{Jianu_2024_ACCV,
  author = {Jianu, Tudor and Huang, Baoru and Nguyen, Hoan and Bhattarai, Binod and Do, Tuong and Tjiputra, Erman and Tran, Quang and Berthet-Rayne, Pierre and Le, Ngan and Fichera, Sebastiano and Nguyen, Anh},
  title = {{Guide3D}: A Bi-planar {X-ray} Dataset for Guidewire Segmentation and {3D} Reconstruction},
  booktitle = {Proceedings of the Asian Conference on Computer Vision ({ACCV})},
  month = dec,
  year = {2024},
  pages = {1549--1565}
}
DeBiFormer: Vision Transformer with Deformable Agent Bi-level Routing Attention-
[pdf]
[bibtex]@InProceedings{BaoLong_2024_ACCV,
  author = {BaoLong, NguyenHuu and Zhang, Chenyu and Shi, Yuzhi and Hirakawa, Tsubasa and Yamashita, Takayoshi and Matsui, Tohgoroh and Fujiyoshi, Hironobu},
  title = {{DeBiFormer}: Vision Transformer with Deformable Agent Bi-level Routing Attention},
  booktitle = {Proceedings of the Asian Conference on Computer Vision ({ACCV})},
  month = dec,
  year = {2024},
  pages = {4455--4472}
}
MGNiceNet: Unified Monocular Geometric Scene Understanding-
[pdf]
[supp]
[bibtex]@InProceedings{Schon_2024_ACCV,
  author = {Sch{\"o}n, Markus and Buchholz, Michael and Dietmayer, Klaus},
  title = {{MGNiceNet}: Unified Monocular Geometric Scene Understanding},
  booktitle = {Proceedings of the Asian Conference on Computer Vision ({ACCV})},
  month = dec,
  year = {2024},
  pages = {1502--1519}
}
Window-based Channel Attention for Wavelet-enhanced Learned Image Compression-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Xu_2024_ACCV,
  author = {Xu, Heng and Hai, Bowen and Tang, Yushun and He, Zhihai},
  title = {Window-based Channel Attention for Wavelet-enhanced Learned Image Compression},
  booktitle = {Proceedings of the Asian Conference on Computer Vision ({ACCV})},
  month = dec,
  year = {2024},
  pages = {4334--4351}
}
Dual Prototype-driven Objectness Decoupling for Cross-Domain Object Detection in Urban Scene-
[pdf]
[supp]
[bibtex]@InProceedings{Kim_2024_ACCV,
  author = {Kim, Taehoon and Na, Jaemin and Hwang, Joong-won and Chang, Hyung Jin and Hwang, Wonjun},
  title = {Dual Prototype-driven Objectness Decoupling for Cross-Domain Object Detection in Urban Scene},
  booktitle = {Proceedings of the Asian Conference on Computer Vision ({ACCV})},
  month = dec,
  year = {2024},
  pages = {1148--1165}
}
FOTV-HQS: A Fractional-Order Total Variation Model for LiDAR Super-Resolution with Deep Unfolding Network-
[pdf]
[supp]
[bibtex]@InProceedings{Xi_2024_ACCV,
  author = {Xi, Huiying and Yuan, Xia and Wu, Shiwei and Geng, Runze and Wang, Kaiyang and Liang, Yongshun and Zhao, Chunxia},
  title = {{FOTV-HQS}: A Fractional-Order Total Variation Model for {LiDAR} Super-Resolution with Deep Unfolding Network},
  booktitle = {Proceedings of the Asian Conference on Computer Vision ({ACCV})},
  month = dec,
  year = {2024},
  pages = {4034--4050}
}
NT-VOT211: A Large-Scale Benchmark for Night-time Visual Object Tracking-
[pdf]
[supp]
[bibtex]@InProceedings{Liu_2024_ACCV,
  author = {Liu, Yu and Mahmood, Arif and Khan, Muhammad Haris},
  title = {{NT-VOT211}: A Large-Scale Benchmark for Night-time Visual Object Tracking},
  booktitle = {Proceedings of the Asian Conference on Computer Vision ({ACCV})},
  month = dec,
  year = {2024},
  pages = {194--212}
}
StreamMOTP: Streaming and Unified Framework for Joint 3D Multi-Object Tracking and Trajectory Prediction-
[pdf]
[arXiv]
[bibtex]@InProceedings{Zhuang_2024_ACCV,
  author = {Zhuang, Jiaheng and Wang, Guoan and Zhang, Siyu and Wang, Xiyang and Zhou, Hangning and Xu, Ziyao and Zhang, Chi and Li, Zhiheng},
  title = {{StreamMOTP}: Streaming and Unified Framework for Joint {3D} Multi-Object Tracking and Trajectory Prediction},
  booktitle = {Proceedings of the Asian Conference on Computer Vision ({ACCV})},
  month = dec,
  year = {2024},
  pages = {3189--3205}
}
3D Adaptive Structural Convolution Network for Domain-Invariant Point Cloud Recognition-
[pdf]
[arXiv]
[bibtex]@InProceedings{Kim_2024_ACCV,
  author = {Kim, Younggun and Lee, Soomok},
  title = {{3D} Adaptive Structural Convolution Network for Domain-Invariant Point Cloud Recognition},
  booktitle = {Proceedings of the Asian Conference on Computer Vision ({ACCV})},
  month = dec,
  year = {2024},
  pages = {2002--2017}
}
Knowledge Distillation Dealing with Sample-wise Long-tail Problem-
[pdf]
[bibtex]@InProceedings{Yu_2024_ACCV,
  author = {Yu, Tao and Zhao, Xu and An, Yongqi and Tang, Ming and Wang, Jinqiao},
  title = {Knowledge Distillation Dealing with Sample-wise Long-tail Problem},
  booktitle = {Proceedings of the Asian Conference on Computer Vision ({ACCV})},
  month = dec,
  year = {2024},
  pages = {2354--2370}
}
Mamba-based Light Field Super-Resolution with Efficient Subspace Scanning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Gao_2024_ACCV,
  author = {Gao, Ruisheng and Xiao, Zeyu and Xiong, Zhiwei},
  title = {{Mamba}-based Light Field Super-Resolution with Efficient Subspace Scanning},
  booktitle = {Proceedings of the Asian Conference on Computer Vision ({ACCV})},
  month = dec,
  year = {2024},
  pages = {531--547}
}
NewMove: Customizing text-to-video models with novel motions-
[pdf]
[supp]
[bibtex]@InProceedings{Materzynska_2024_ACCV,
  author = {Materzy{\'n}ska, Joanna and Sivic, Josef and Shechtman, Eli and Torralba, Antonio and Zhang, Richard and Russell, Bryan},
  title = {{NewMove}: Customizing text-to-video models with novel motions},
  booktitle = {Proceedings of the Asian Conference on Computer Vision ({ACCV})},
  month = dec,
  year = {2024},
  pages = {1634--1651}
}
QR-DETR : Query Routing for Detection Transformer-
[pdf]
[bibtex]@InProceedings{Senthivel_2024_ACCV,
  author = {Senthivel, Tharsan and Vu, Ngoc-Son},
  title = {{QR-DETR} : Query Routing for Detection Transformer},
  booktitle = {Proceedings of the Asian Conference on Computer Vision ({ACCV})},
  month = dec,
  year = {2024},
  pages = {354--371}
}
SurfOcc: Surface-based Feature Lifting for Vision-centric 3D Occupancy Prediction-
[pdf]
[bibtex]@InProceedings{Ye_2024_ACCV,
  author = {Ye, Tonghui and Gao, Zhi and Lin, Zhipeng and Liu, Xinyi and Jin, Ronghe},
  title = {{SurfOcc}: Surface-based Feature Lifting for Vision-centric {3D} Occupancy Prediction},
  booktitle = {Proceedings of the Asian Conference on Computer Vision ({ACCV})},
  month = dec,
  year = {2024},
  pages = {2421--2438}
}
Hierarchical Prompting for Diffusion Classifiers-
[pdf]
[supp]
[bibtex]@InProceedings{Ning_2024_ACCV,
  author = {Ning, Wenxin and Chang, Dongliang and Tong, Yujun and He, Zhongjiang and Liang, Kongming and Ma, Zhanyu},
  title = {Hierarchical Prompting for Diffusion Classifiers},
  booktitle = {Proceedings of the Asian Conference on Computer Vision ({ACCV})},
  month = dec,
  year = {2024},
  pages = {1284--1300}
}
Enhanced Asymmetric Invertible Network for Neural Video Delivery-
[pdf]
[bibtex]@InProceedings{Tian_2024_ACCV,
  author = {Tian, Wenbin and Jiang, Qingmiao and Chen, Lu and Li, Haolin and Yan, Jinyao},
  title = {Enhanced Asymmetric Invertible Network for Neural Video Delivery},
  booktitle = {Proceedings of the Asian Conference on Computer Vision ({ACCV})},
  month = dec,
  year = {2024},
  pages = {2751--2766}
}
DepthSegNet24: A Label-Free Model for Robust Day-Night Depth and Semantics-
[pdf]
[supp]
[bibtex]@InProceedings{Thanh_2024_ACCV,
  author = {Thanh, Phan Thi Huyen and Nguyen, The Hiep and Nguyen, Minh Huy Vu and Tran, Trung Thai and Pham, Tran Vu and Nguyen, Duc Dung and Duy, Truong Vinh Truong and Naotake, Natori},
  title = {{DepthSegNet24}: A Label-Free Model for Robust Day-Night Depth and Semantics},
  booktitle = {Proceedings of the Asian Conference on Computer Vision ({ACCV})},
  month = dec,
  year = {2024},
  pages = {2716--2733}
}
DiffLoss: Unleashing Diffusion Model as Constraint for Training Image Restoration Network-
[pdf]
[supp]
[bibtex]@InProceedings{Tan_2024_ACCV,
  author = {Tan, Jiangtong and Yu, Hu and Huang, Jie and Yang, Zizheng and Zhao, Feng},
  title = {{DiffLoss}: Unleashing Diffusion Model as Constraint for Training Image Restoration Network},
  booktitle = {Proceedings of the Asian Conference on Computer Vision ({ACCV})},
  month = dec,
  year = {2024},
  pages = {1566--1584}
}
3D Prompt Learning for RGB-D Tracking-
[pdf]
[supp]
[bibtex]@InProceedings{Li_2024_ACCV,
  author = {Li, Bocen and Zhuge, Yunzhi and Jiang, Shan and Wang, Lijun and Wang, Yifan and Lu, Huchuan},
  title = {{3D} Prompt Learning for {RGB-D} Tracking},
  booktitle = {Proceedings of the Asian Conference on Computer Vision ({ACCV})},
  month = dec,
  year = {2024},
  pages = {2527--2544}
}
TANet: Triplet Attention Network for All-In-One Adverse Weather Image Restoration-
[pdf]
[arXiv]
[bibtex]@InProceedings{Wang_2024_ACCV,
  author = {Wang, Hsing-Hua and Tsai, Fu-Jen and Lin, Yen-Yu and Lin, Chia-Wen},
  title = {{TANet}: Triplet Attention Network for All-In-One Adverse Weather Image Restoration},
  booktitle = {Proceedings of the Asian Conference on Computer Vision ({ACCV})},
  month = dec,
  year = {2024},
  pages = {835--851}
}
PMTrack: Multi-object Tracking with Motion-Aware-
[pdf]
[bibtex]@InProceedings{Guo_2024_ACCV,
  author = {Guo, Xu and Zheng, Yujin and Wang, Dingwen},
  title = {{PMTrack}: Multi-object Tracking with Motion-Aware},
  booktitle = {Proceedings of the Asian Conference on Computer Vision ({ACCV})},
  month = dec,
  year = {2024},
  pages = {3091--3106}
}
Designing Extremely Memory-Efficient CNNs for On-device Vision Tasks-
[pdf]
[arXiv]
[bibtex]@InProceedings{Lee_2024_ACCV,
  author = {Lee, Jaewook and Park, Yoel and Lee, Seulki},
  title = {Designing Extremely Memory-Efficient {CNNs} for On-device Vision Tasks},
  booktitle = {Proceedings of the Asian Conference on Computer Vision ({ACCV})},
  month = dec,
  year = {2024},
  pages = {303--318}
}
A Multi-Phase Multi-Graph Approach for Focal Liver Lesion Classification on CT Scans-
[pdf]
[bibtex]@InProceedings{Sam_2024_ACCV,
  author = {Sam, Tran Bao and Huy, Ta Duc and Dao, Cong Tuyen and Lam, Thanh Tin and Tang, Van Ha and Truong, Steven Q. H.},
  title = {A Multi-Phase Multi-Graph Approach for Focal Liver Lesion Classification on {CT} Scans},
  booktitle = {Proceedings of the Asian Conference on Computer Vision ({ACCV})},
  month = dec,
  year = {2024},
  pages = {3788--3802}
}
A Recipe for CAC: Mosaic-based Generalized Loss for Improved Class-Agnostic Counting-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chou_2024_ACCV,
  author = {Chou, Tsung-Han and Wang, Brian and Chiu, Wei-Chen and Chen, Jun-Cheng},
  title = {A Recipe for {CAC}: Mosaic-based Generalized Loss for Improved Class-Agnostic Counting},
  booktitle = {Proceedings of the Asian Conference on Computer Vision ({ACCV})},
  month = dec,
  year = {2024},
  pages = {2906--2921}
}
RS-SAM: Integrating Multi-Scale Information for Enhanced Remote Sensing Image Segmentation-
[pdf]
[bibtex]@InProceedings{Zhang_2024_ACCV,
  author = {Zhang, Enkai and Liu, Jingjing and Cao, Anda and Sun, Zhen and Zhang, Haofei and Wang, Huiqiong and Sun, Li and Song, Mingli},
  title = {{RS-SAM}: Integrating Multi-Scale Information for Enhanced Remote Sensing Image Segmentation},
  booktitle = {Proceedings of the Asian Conference on Computer Vision ({ACCV})},
  month = dec,
  year = {2024},
  pages = {994--1010}
}
VIPNet: Combining Viewpoint Information and Shape Priors for Instant Multi-View 3D Reconstruction-
[pdf]
[supp]
[bibtex]@InProceedings{Ye_2024_ACCV,
  author = {Ye, Weining and Li, Zhixuan and Jiang, Tingting},
  title = {{VIPNet}: Combining Viewpoint Information and Shape Priors for Instant Multi-View {3D} Reconstruction},
  booktitle = {Proceedings of the Asian Conference on Computer Vision ({ACCV})},
  month = dec,
  year = {2024},
  pages = {3379--3395}
}
Leveraging Semantic Cues from Foundation Vision Models for Enhanced Local Feature Correspondence-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Cadar_2024_ACCV, author = {Cadar, Felipe and Potje, Guilherme and Martins, Renato and Demonceaux, C{\'e}dric and Nascimento, Erickson R.}, title = {Leveraging Semantic Cues from Foundation Vision Models for Enhanced Local Feature Correspondence}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {1268-1283} }
SAMIF: Adapting Segment Anything Model for Image Inpainting Forensics-
[pdf]
[bibtex]@InProceedings{Zhang_2024_ACCV, author = {Zhang, Lan and Zhu, Xinshan and He, Di and Liao, Xin and Sun, Biao}, title = {SAMIF: Adapting Segment Anything Model for Image Inpainting Forensics}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {3605-3621} }
Language-Guided Joint Audio-Visual Editing via One-Shot Adaptation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liang_2024_ACCV, author = {Liang, Susan and Huang, Chao and Tian, Yapeng and Kumar, Anurag and Xu, Chenliang}, title = {Language-Guided Joint Audio-Visual Editing via One-Shot Adaptation}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {1011-1027} }
Faster convergence and Uncorrelated gradients in Self-Supervised Online Continual Learning-
[pdf]
[supp]
[bibtex]@InProceedings{Imai_2024_ACCV, author = {Imai, Koyo and Hayashi, Naoto and Hirakawa, Tsubasa and Yamashita, Takayoshi and Fujiyoshi, Hironobu}, title = {Faster convergence and Uncorrelated gradients in Self-Supervised Online Continual Learning}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {436-453} }
Dynamic Window Transformer for Image Super-Resolution-
[pdf]
[bibtex]@InProceedings{Xie_2024_ACCV, author = {Xie, Zheng and Wang, Zhongxun and Qin, Tianci and Han, Zhexuan and Zhou, Ruoyu}, title = {Dynamic Window Transformer for Image Super-Resolution}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {3836-3850} }
Direct Alignment for Robust NeRF Learning-
[pdf]
[supp]
[bibtex]@InProceedings{Garg_2024_ACCV, author = {Garg, Ravi and Chng, Shin-Fang and Lucey, Simon}, title = {Direct Alignment for Robust NeRF Learning}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {3947-3963} }
More and Larger Auxiliary Feature-Guided Spatial-Temporal Super-Resolution for Rendered Sequences-
[pdf]
[bibtex]@InProceedings{Zheng_2024_ACCV, author = {Zheng, Lijie and Liang, Xiao}, title = {More and Larger Auxiliary Feature-Guided Spatial-Temporal Super-Resolution for Rendered Sequences}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {1986-2001} }
Strike the Balance: On-the-Fly Uncertainty based User Interactions for Long-Term Video Object Segmentation-
[pdf]
[supp]
[bibtex]@InProceedings{Vujasinovic_2024_ACCV, author = {Vujasinovi{\'c}, St{\'e}phane and Becker, Stefan and Bullinger, Sebastian and Scherer-Negenborn, Norbert and Arens, Michael and Stiefelhagen, Rainer}, title = {Strike the Balance: On-the-Fly Uncertainty based User Interactions for Long-Term Video Object Segmentation}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {2784-2802} }
Unsupervised Video Summarization via Iterative Training and Simplified GAN-
[pdf]
[supp]
[bibtex]@InProceedings{Li_2024_ACCV, author = {Li, Hanqing and Klabjan, Diego and Utke, Jean}, title = {Unsupervised Video Summarization via Iterative Training and Simplified GAN}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {1585-1601} }
Generalizable Structure-Aware INF: Biplanar-View CT Reconstruction via Disentangled Implicit Neural Field-
[pdf]
[bibtex]@InProceedings{Huang_2024_ACCV, author = {Huang, Bei and Pei, Yuru}, title = {Generalizable Structure-Aware INF: Biplanar-View CT Reconstruction via Disentangled Implicit Neural Field}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {699-715} }
MECFormer: Multi-task Whole Slide Image Classification with Expert Consultation Network-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Bui_2024_ACCV, author = {Bui, Doanh C. and Kwak, Jin Tae}, title = {MECFormer: Multi-task Whole Slide Image Classification with Expert Consultation Network}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {1602-1617} }
SRIL: Selective Regularization for Class-Incremental Learning-
[pdf]
[arXiv]
[bibtex]@InProceedings{Han_2024_ACCV, author = {Han, Jisu and Na, Jaemin and Hwang, Wonjun}, title = {SRIL: Selective Regularization for Class-Incremental Learning}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {1532-1548} }
DeTurb: Atmospheric Turbulence Mitigation with Deformable 3D Convolutions and 3D Swin Transformers-
[pdf]
[arXiv]
[bibtex]@InProceedings{Zou_2024_ACCV, author = {Zou, Zhicheng and Anantrasirichai, Nantheera}, title = {DeTurb: Atmospheric Turbulence Mitigation with Deformable 3D Convolutions and 3D Swin Transformers}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {904-921} }
DepthBLIP-2: Leveraging Language to Guide BLIP-2 in Understanding Depth Information-
[pdf]
[bibtex]@InProceedings{Chen_2024_ACCV, author = {Chen, Wei and Shi, Changyong and Ma, Chuanxiang and Li, Wenhao and Dong, Shulei}, title = {DepthBLIP-2: Leveraging Language to Guide BLIP-2 in Understanding Depth Information}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {2939-2953} }
Learning Neural Radiance Field from Quasi-Uniformly Sampled Spherical Image for Immersive Virtual Reality-
[pdf]
[supp]
[bibtex]@InProceedings{Wang_2024_ACCV, author = {Wang, Le and Li, Shigang}, title = {Learning Neural Radiance Field from Quasi-Uniformly Sampled Spherical Image for Immersive Virtual Reality}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {1166-1180} }
Strong but simple: A Baseline for Domain Generalized Dense Perception by CLIP-based Transfer Learning-
[pdf]
[supp]
[bibtex]@InProceedings{Hummer_2024_ACCV, author = {H{\"u}mmer, Christoph and Schwonberg, Manuel and Zhou, Liangwei and Cao, Hu and Knoll, Alois and Gottschalk, Hanno}, title = {Strong but simple: A Baseline for Domain Generalized Dense Perception by CLIP-based Transfer Learning}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {4223-4244} }
DFIMat: Decoupled Flexible Interactive Matting in Multi-Person Scenarios-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Jiao_2024_ACCV, author = {Jiao, Siyi and Zeng, Wenzheng and Gao, Changxin and Sang, Nong}, title = {DFIMat: Decoupled Flexible Interactive Matting in Multi-Person Scenarios}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {2988-3004} }
Multiple active stereo systems calibration method based on Neural SDF using DSSS for wide area 3D reconstruction-
[pdf]
[bibtex]@InProceedings{Nishihara_2024_ACCV, author = {Nishihara, Kota and Furukawa, Ryo and Sagawa, Ryusuke and Kawasaki, Hiroshi}, title = {Multiple active stereo systems calibration method based on Neural SDF using DSSS for wide area 3D reconstruction}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {2838-2854} }
S2Net: Skeleton-aware SlowFast Network for Efficient Sign Language Recognition-
[pdf]
[supp]
[bibtex]@InProceedings{Yang_2024_ACCV, author = {Yang, Yifan and Min, Yuecong and Chen, Xilin}, title = {S2Net: Skeleton-aware SlowFast Network for Efficient Sign Language Recognition}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {319-336} }
Rethinking Sampling for Music-Driven Long-Term Dance Generation-
[pdf]
[bibtex]@InProceedings{Truong-Thuy_2024_ACCV, author = {Truong-Thuy, Tuong-Vy and Bui-Le, Gia-Cat and Nguyen, Hai-Dang and Le, Trung-Nghia}, title = {Rethinking Sampling for Music-Driven Long-Term Dance Generation}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {2667-2683} }
Continual Learning Improves Zero-Shot Action Recognition-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Gowda_2024_ACCV, author = {Gowda, Shreyank N and Moltisanti, Davide and Sevilla-Lara, Laura}, title = {Continual Learning Improves Zero-Shot Action Recognition}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {3239-3256} }
Semantic Visual-inertial SLAM for Automated Valet Parking-
[pdf]
[bibtex]@InProceedings{Oh_2024_ACCV, author = {Oh, Seungwon and Seo, Junghoon and Park, Jungho and Veera, Viswanath and Felix, Jersha and Menon, Midhun and Shinde, Chinmay}, title = {Semantic Visual-inertial SLAM for Automated Valet Parking}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {733-746} }
Content-Adaptive Style Transfer: A Training-Free Approach with VQ Autoencoders-
[pdf]
[supp]
[bibtex]@InProceedings{Gim_2024_ACCV, author = {Gim, Jongmin and Park, Jihun and Lee, Kyoungmin and Im, Sunghoon}, title = {Content-Adaptive Style Transfer: A Training-Free Approach with VQ Autoencoders}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {2337-2353} }
TGCM: Cross-Domain Few-Shot Semantic Segmentation via one-shot Target Guided CutMix-
[pdf]
[bibtex]@InProceedings{Wei_2024_ACCV, author = {Wei, HaiTao and Liu, JianMing and Chen, Tong and Qiu, WenLong}, title = {TGCM: Cross-Domain Few-Shot Semantic Segmentation via one-shot Target Guided CutMix}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {1065-1081} }
Latency Attack Resilience in Object Detectors: Insights from Computing Architecture-
[pdf]
[bibtex]@InProceedings{Chen_2024_ACCV, author = {Chen, Erh-Chung and Chen, Pin-Yu and Chung, I-Hsin and Lee, Che-Rung}, title = {Latency Attack Resilience in Object Detectors: Insights from Computing Architecture}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {3206-3222} }
Underground Mapping and Localization Based on Ground-Penetrating Radar-
[pdf]
[arXiv]
[bibtex]@InProceedings{Zhang_2024_ACCV, author = {Zhang, Jinchang and Lu, Guoyu}, title = {Underground Mapping and Localization Based on Ground-Penetrating Radar}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {2018-2033} }
Learning 3D Point Cloud Registration as a Single Optimization Problem-
[pdf]
[supp]
[bibtex]@InProceedings{Yanagi_2024_ACCV, author = {Yanagi, Rintaro and Hashimoto, Atsushi and Chiba, Naoya and Sone, Shusaku and Ma, Jiaxin and Ushiku, Yoshitaka}, title = {Learning 3D Point Cloud Registration as a Single Optimization Problem}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {3292-3309} }
Amodal Instance Segmentation with Diffusion Shape Prior Estimation-
[pdf]
[arXiv]
[bibtex]@InProceedings{Tran_2024_ACCV, author = {Tran, Minh and Vo, Khoa and Nguyen, Tri and Le, Ngan}, title = {Amodal Instance Segmentation with Diffusion Shape Prior Estimation}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {1181-1196} }
Polyp-SES: Automatic Polyp Segmentation with Self-Enriched Semantic Model-
[pdf]
[bibtex]@InProceedings{Nguyen_2024_ACCV, author = {Nguyen, Quang Vinh and Vo, Thanh Hoang Son and Kang, Sae-Ryung and Kim, Soo-Hyung}, title = {Polyp-SES: Automatic Polyp Segmentation with Self-Enriched Semantic Model}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {2803-2819} }
OneDiff: A Generalist Model for Image Difference Captioning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Hu_2024_ACCV, author = {Hu, Erdong and Guo, Longteng and Yue, Tongtian and Zhao, Zijia and Xue, Shuning and Liu, Jing}, title = {OneDiff: A Generalist Model for Image Difference Captioning}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {2439-2455} }
MV2MP: Segmentation Free Performance Capture of Humans in Direct Physical Contact from Sparse Multi-Cam Setups-
[pdf]
[supp]
[bibtex]@InProceedings{Eliseev_2024_ACCV, author = {Eliseev, Sergei and Shtanko, Leonid and Akhunzianov, Rasim and Romanenko, Yaroslav and Starostin, Anatoly}, title = {MV2MP: Segmentation Free Performance Capture of Humans in Direct Physical Contact from Sparse Multi-Cam Setups}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {4172-4188} }
Exploiting Cross-modal Cost Volume for Multi-sensor Depth Estimation-
[pdf]
[supp]
[bibtex]@InProceedings{Kim_2024_ACCV, author = {Kim, Janghyun and Shin, Ukcheol and Heo, Seokyong and Park, Jinsun}, title = {Exploiting Cross-modal Cost Volume for Multi-sensor Depth Estimation}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {1420-1436} }
Parameter-Efficient Instance-Adaptive Neural Video Compression-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Oh_2024_ACCV, author = {Oh, Seungjun and Yang, Hyunmo and Park, Eunbyung}, title = {Parameter-Efficient Instance-Adaptive Neural Video Compression}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {250-267} }
Improving Image Clustering with Artifacts Attenuation via Inference-Time Attention Engineering-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Nakamura_2024_ACCV, author = {Nakamura, Kazumoto and Nozawa, Yuji and Lin, Yu-Chieh and Nakata, Kengo and Ng, Youyang}, title = {Improving Image Clustering with Artifacts Attenuation via Inference-Time Attention Engineering}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {3396-3413} }
Enhanced Kalman with Adaptive Appearance Motion SORT for Grounded Generic Multiple Object Tracking-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Le_Dinh_Anh_2024_ACCV, author = {Le Dinh Anh, Duy and Tran, Kim Hoang and Nguyen, Quang-Thuc and Le, Ngan Hoang}, title = {Enhanced Kalman with Adaptive Appearance Motion SORT for Grounded Generic Multiple Object Tracking}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {145-161} }
LoCo-MAD: Long-Range Context-Enhanced Model Towards Plot-Centric Movie Audio Description-
[pdf]
[supp]
[bibtex]@InProceedings{Wang_2024_ACCV, author = {Wang, Jiayi and Liu, Zihao and Wu, Xiaoyu}, title = {LoCo-MAD: Long-Range Context-Enhanced Model Towards Plot-Centric Movie Audio Description}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {1366-1383} }
Dual-path Multimodal Optimal Transport for Composed Image Retrieval-
[pdf]
[bibtex]@InProceedings{Yan_2024_ACCV, author = {Yan, Cairong and Ma, Meng and Zhang, Yanting and Wan, Yongquan}, title = {Dual-path Multimodal Optimal Transport for Composed Image Retrieval}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {1741-1755} }
EDeRF: Updating Local Scenes and Editing Across Fields for Real-Time Dynamic Reconstruction of Road Scene-
[pdf]
[bibtex]@InProceedings{Liang_2024_ACCV, author = {Liang, Zhaoxiang and Guo, Wenjun and Yang, Yi and Liu, Tong}, title = {EDeRF: Updating Local Scenes and Editing Across Fields for Real-Time Dynamic Reconstruction of Road Scene}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {3120-3136} }
Accelerated Deep Nonlinear Dictionary Learning-
[pdf]
[bibtex]@InProceedings{Tan_2024_ACCV, author = {Tan, Benying and Lin, Jie and Qin, Yang and Ding, Shuxue and Li, Yujie}, title = {Accelerated Deep Nonlinear Dictionary Learning}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {4439-4454} }
PrimeDepth: Efficient Monocular Depth Estimation with a Stable Diffusion Preimage-
[pdf]
[bibtex]@InProceedings{Zavadski_2024_ACCV, author = {Zavadski, Denis and Kal{\v{s}}an, Damjan and Rother, Carsten}, title = {PrimeDepth: Efficient Monocular Depth Estimation with a Stable Diffusion Preimage}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {922-940} }
GPNF: A Point Cloud Registration Framework Using Sharp Global Linear Attention Prior and Neighborhood Filtering Strategy-
[pdf]
[supp]
[bibtex]@InProceedings{Zhu_2024_ACCV, author = {Zhu, Congyang and Yin, Mengxiao and Liao, Junjie and Liang, Zhijie and Chang, Kan}, title = {GPNF: A Point Cloud Registration Framework Using Sharp Global Linear Attention Prior and Neighborhood Filtering Strategy}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {2489-2506} }
Enhancing Anchor-based Weakly Supervised Referring Expression Comprehension with Cross-Modality Attention-
[pdf]
[bibtex]@InProceedings{Chu_2024_ACCV, author = {Chu, Ting-Yu and Lin, Yong-Xiang and Huang, Ching-Chun and Hua, Kai-Lung}, title = {Enhancing Anchor-based Weakly Supervised Referring Expression Comprehension with Cross-Modality Attention}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {2767-2783} }
Deformable Shape-aware Point Generation for 3D Object Detection-
[pdf]
[supp]
[bibtex]@InProceedings{Wang_2024_ACCV, author = {Wang, Kai and Zhang, Xiaowei}, title = {Deformable Shape-aware Point Generation for 3D Object Detection}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {2699-2715} }
VideoPatchCore: An Effective Method to Memorize Normality for Video Anomaly Detection-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ahn_2024_ACCV, author = {Ahn, Sunghyun and Jo, Youngwan and Lee, Kijung and Park, Sanghyun}, title = {VideoPatchCore: An Effective Method to Memorize Normality for Video Anomaly Detection}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {2179-2195} }
CNG-SFDA: Clean-and-Noisy Region Guided Online-Offline Source-Free Domain Adaptation-
[pdf]
[supp]
[bibtex]@InProceedings{Cho_2024_ACCV, author = {Cho, Hyeonwoo and Park, Chanmin and Kim, Dong-Hee and Kim, Jinyoung and Kim, Won Hwa}, title = {CNG-SFDA: Clean-and-Noisy Region Guided Online-Offline Source-Free Domain Adaptation}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {1723-1740} }
HT-SSPG: Hierarchical Transformers for Semantic Surface Point Generation in 3D Object Detection-
[pdf]
[bibtex]@InProceedings{Kong_2024_ACCV, author = {Kong, Wenhao and Zhang, Xiaowei}, title = {HT-SSPG: Hierarchical Transformers for Semantic Surface Point Generation in 3D Object Detection}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {3672-3688} }
O1O: Grouping of Known Classes to Identify Unknown Objects as Odd-One-Out-
[pdf]
[supp]
[bibtex]@InProceedings{Yavuz_2024_ACCV, author = {Yavuz, M{\i}sra and G{\"u}ney, Fatma}, title = {O1O: Grouping of Known Classes to Identify Unknown Objects as Odd-One-Out}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {614-629} }
Real-SRGD: Enhancing Real-World Image Super-Resolution with Classifier-Free Guided Diffusion-
[pdf]
[supp]
[bibtex]@InProceedings{Doi_2024_ACCV, author = {Doi, Kenji and Okada, Shuntaro and Yoshihashi, Ryota and Kataoka, Hirokatsu}, title = {Real-SRGD: Enhancing Real-World Image Super-Resolution with Classifier-Free Guided Diffusion}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {3739-3755} }
HDNeXt: Hybrid Dynamic MedNeXt with Level Set Regularization for Medical Image Segmentation-
[pdf]
[bibtex]@InProceedings{Cao_2024_ACCV, author = {Cao, Haoyu and Han, Tianyi and Yang, Yunyun}, title = {HDNeXt: Hybrid Dynamic MedNeXt with Level Set Regularization for Medical Image Segmentation}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {597-613} }
VIP: Versatile Image Outpainting Empowered by Multimodal Large Language Model-
[pdf]
[arXiv]
[bibtex]@InProceedings{Yang_2024_ACCV, author = {Yang, Jinze and Wang, Haoran and Zhu, Zining and Liu, Chenglong and Wu, Meng and Sun, Mingming}, title = {VIP: Versatile Image Outpainting Empowered by Multimodal Large Language Model}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {1082-1099} }
Capture Concept through Comparison: Vision-and-Language Representation Learning with Intrinsic Information Mining-
[pdf]
[bibtex]@InProceedings{Song_2024_ACCV, author = {Song, Yun-Zhu and Chen, Yi-Syuan and Lin, Tzu-Ling and Liu, Bei and Fu, Jianlong and Shuai, Hong-Han}, title = {Capture Concept through Comparison: Vision-and-Language Representation Learning with Intrinsic Information Mining}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {4299-4317} }
Image Deraining with Frequency-Enhanced State Space Model-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yamashita_2024_ACCV, author = {Yamashita, Shugo and Ikehara, Masaaki}, title = {Image Deraining with Frequency-Enhanced State Space Model}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {3655-3671} }
3D-Aware Instance Segmentation and Tracking in Egocentric Videos-
[pdf]
[arXiv]
[bibtex]@InProceedings{Bhalgat_2024_ACCV, author = {Bhalgat, Yash and Tschernezki, Vadim and Laina, Iro and Henriques, Jo{\~a}o F. and Vedaldi, Andrea and Zisserman, Andrew}, title = {3D-Aware Instance Segmentation and Tracking in Egocentric Videos}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {2562-2578} }
FedRepOpt: Gradient Re-parametrized Optimizers in Federated Learning-
[pdf]
[supp]
[bibtex]@InProceedings{Lau_2024_ACCV, author = {Lau, Kin Wai and Rehman, Yasar Abbas Ur and de Gusm{\~a}o, Pedro Porto Buarque and Po, Lai-Man and Ma, Lan and Xie, Yuyang}, title = {FedRepOpt: Gradient Re-parametrized Optimizers in Federated Learning}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {1866-1882} }
Facing Asymmetry - Uncovering the Causal Link between Facial Symmetry and Expression Classifiers using Synthetic Interventions-
[pdf]
[supp]
[bibtex]@InProceedings{Buchner_2024_ACCV, author = {B{\"u}chner, Tim and Penzel, Niklas and Guntinas-Lichius, Orlando and Denzler, Joachim}, title = {Facing Asymmetry - Uncovering the Causal Link between Facial Symmetry and Expression Classifiers using Synthetic Interventions}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {4100-4121} }
Boosting Few-Shot Detection with Large Language Models and Layout-to-Image Synthesis-
[pdf]
[bibtex]@InProceedings{Abdullah_2024_ACCV, author = {Abdullah, Ahmed and Ebert, Nikolas and Wasenm{\"u}ller, Oliver}, title = {Boosting Few-Shot Detection with Large Language Models and Layout-to-Image Synthesis}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {3517-3530} }
Attention4Align: Align Multi-View Parts Via Part2Part Hierarchical Attention Maps for Fine-Grained 3D Object Classification-
[pdf]
[bibtex]@InProceedings{Zhang_2024_ACCV, author = {Zhang, Runchu and Yue, Jiahe and Zhang, Zhe and Ma, Jie}, title = {Attention4Align: Align Multi-View Parts Via Part2Part Hierarchical Attention Maps for Fine-Grained 3D Object Classification}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {4245-4261} }
Relative pose from cylinder silhouettes-
[pdf]
[bibtex]@InProceedings{Gummeson_2024_ACCV, author = {Gummeson, Anna and Oskarsson, Magnus}, title = {Relative pose from cylinder silhouettes}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {2545-2561} }
UAGE: A Supervised Contrastive Method for Unconstrained Adaptive Gaze Estimation-
[pdf]
[bibtex]@InProceedings{Lan_2024_ACCV, author = {Lan, Enfan and Hu, Zhengxi and Liu, Jingtai}, title = {UAGE: A Supervised Contrastive Method for Unconstrained Adaptive Gaze Estimation}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {2231-2247} }
ReLUifying Smooth Functions: Low-Cost Knowledge Distillation to Obtain High-Performance ReLU Networks-
[pdf]
[supp]
[bibtex]@InProceedings{Kim_2024_ACCV, author = {Kim, Soosung and Park, Yeonhong and Lee, Hyunseung and Yi, Sungchan and Lee, Jae W.}, title = {ReLUifying Smooth Functions: Low-Cost Knowledge Distillation to Obtain High-Performance ReLU Networks}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {2162-2178} }
Frequency Learning Network with Dual-Guidance Calibration for Camouflaged Object Detection-
[pdf]
[bibtex]@InProceedings{Zhao_2024_ACCV, author = {Zhao, Yilin and Zhang, Qing and Li, Yuetong}, title = {Frequency Learning Network with Dual-Guidance Calibration for Camouflaged Object Detection}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {3851-3864} }
Telling Stories for Common Sense Zero-shot Action Recognition-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Gowda_2024_ACCV, author = {Gowda, Shreyank N and Sevilla-Lara, Laura}, title = {Telling Stories for Common Sense Zero-shot Action Recognition}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {4577-4594} }
Federated Class Incremental Learning: A Pseudo Feature Based Approach Without Exemplars-
[pdf]
[bibtex]@InProceedings{Yoo_2024_ACCV, author = {Yoo, Min Kyoon and Park, Yu Rang}, title = {Federated Class Incremental Learning: A Pseudo Feature Based Approach Without Exemplars}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {488-498} }
Progressive Target Refinement by Self-Distillation for Human Pose Estimation-
[pdf]
[bibtex]@InProceedings{Li_2024_ACCV, author = {Li, Jingtian and Fang, Lin and Wu, Yi and Wang, Shangfei}, title = {Progressive Target Refinement by Self-Distillation for Human Pose Estimation}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {3934-3946} }
IDDiffuse: Dual-Conditional Diffusion Model for Enhanced Facial Image Anonymization-
[pdf]
[bibtex]@InProceedings{Shaheryar_2024_ACCV, author = {Shaheryar, Muhammad and Lee, Jong Taek and Jung, Soon Ki}, title = {IDDiffuse: Dual-Conditional Diffusion Model for Enhanced Facial Image Anonymization}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {4017-4033} }
CrossViT-ReID: Cross-Attention Vision Transformer for Occluded Cloth-Changing Person Re-Identification-
[pdf]
[bibtex]@InProceedings{Nguyen_2024_ACCV, author = {Nguyen, Vuong D. and Mantini, Pranav and Shah, Shishir K.}, title = {CrossViT-ReID: Cross-Attention Vision Transformer for Occluded Cloth-Changing Person Re-Identification}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {3982-3999} }
Enhancing 3D Human Pose Estimation with Bone Length Adjustment-
[pdf]
[arXiv]
[bibtex]@InProceedings{Hsu_2024_ACCV, author = {Hsu, Chih-Hsiang and Jang, Jyh-Shing Roger}, title = {Enhancing 3D Human Pose Estimation with Bone Length Adjustment}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {3723-3738} }
COCA: Classifier-Oriented Calibration via Textual Prototype for Source-Free Universal Domain Adaptation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Liu_2024_ACCV, author = {Liu, Xinghong and Zhou, Yi}, title = {COCA: Classifier-Oriented Calibration via Textual Prototype for Source-Free Universal Domain Adaptation}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {1671-1687} }
Enhancing Object Detection in Adverse Weather Conditions through Entropy and Guided Multimodal Fusion-
[pdf]
[bibtex]@InProceedings{Zhang_2024_ACCV, author = {Zhang, Zhenrong and Gong, Haoyan and Feng, Yuzheng and Chu, Zixuan and Liu, Hongbin}, title = {Enhancing Object Detection in Adverse Weather Conditions through Entropy and Guided Multimodal Fusion}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {2922-2938} }
GReFEL: Geometry-Aware Reliable Facial Expression Learning under Bias and Imbalanced Data Distribution-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wasi_2024_ACCV, author = {Wasi, Azmine Toushik and Rafi, Taki Hasan and Islam, Raima and {\v{S}}erbetar, Karlo and Chae, Dong-Kyu}, title = {GReFEL: Geometry-Aware Reliable Facial Expression Learning under Bias and Imbalanced Data Distribution}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {4368-4384} }
Scene-Adaptive SVAD Based On Multi-modal Action-based Feature Extraction-
[pdf]
[supp]
[bibtex]@InProceedings{Gao_2024_ACCV, author = {Gao, Shibo and Yang, Peipei and Huang, Linlin}, title = {Scene-Adaptive SVAD Based On Multi-modal Action-based Feature Extraction}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {2471-2488} }
LoG-VMamba: Local-Global Vision Mamba for Medical Image Segmentation-
[pdf]
[supp]
[bibtex]@InProceedings{Dang_2024_ACCV, author = {Dang, Trung Dinh Quoc and Nguyen, Huy Hoang and Tiulpin, Aleksei}, title = {LoG-VMamba: Local-Global Vision Mamba for Medical Image Segmentation}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {548-565} }
Domain Aware Multi-Task Pre-Training of 3D Swin Transformer for Brain MRI-
[pdf]
[supp]
[bibtex]@InProceedings{Kim_2024_ACCV, author = {Kim, Jonghun and Kim, Mansu and Park, Hyunjin}, title = {Domain Aware Multi-Task Pre-Training of 3D Swin Transformer for Brain MRI}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {2124-2144} }
CoVLM: Leveraging Consensus from Vision-Language Models for Semi-supervised Multimodal Fake News Detection-
[pdf]
[bibtex]@InProceedings{Devank_2024_ACCV, author = {Devank and Kalla, Jayateja and Biswas, Soma}, title = {CoVLM: Leveraging Consensus from Vision-Language Models for Semi-supervised Multimodal Fake News Detection}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {1197-1214} }
Graph Cut-guided Maximal Coding Rate Reduction for Learning Image Embedding and Clustering-
[pdf]
[supp]
[bibtex]@InProceedings{He_2024_ACCV, author = {He, Wei and Huang, Zhiyuan and Meng, Xianghan and Qi, Xianbiao and Xiao, Rong and Li, Chun-Guang}, title = {Graph Cut-guided Maximal Coding Rate Reduction for Learning Image Embedding and Clustering}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {1883-1899} }
Tails Tell Tales: Chapter-wide Manga Transcriptions with Character Names-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Sachdeva_2024_ACCV, author = {Sachdeva, Ragav and Shin, Gyungin and Zisserman, Andrew}, title = {Tails Tell Tales: Chapter-wide Manga Transcriptions with Character Names}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {2053-2069} }
Interaction-Guided Two-Branch Image Dehazing Network-
[pdf]
[arXiv]
[bibtex]@InProceedings{Liu_2024_ACCV, author = {Liu, Huichun and Li, Xiaosong and Tan, Tianshu}, title = {Interaction-Guided Two-Branch Image Dehazing Network}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {4069-4084} }
Auxiliary Domain-guided Adaptive Detection in Adverse Weather Conditions-
[pdf]
[bibtex]@InProceedings{Fu_2024_ACCV, author = {Fu, Zhuobin and Chang, Kan and Ling, Mingyang and Zhang, Qingzhi and Qi, Enze}, title = {Auxiliary Domain-guided Adaptive Detection in Adverse Weather Conditions}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {3964-3981} }
OccFusion: Depth Estimation Free Multi-sensor Fusion for 3D Occupancy Prediction-
[pdf]
[arXiv]
[bibtex]@InProceedings{Zhang_2024_ACCV, author = {Zhang, Ji and Ding, Yiran and Liu, Zixin}, title = {OccFusion: Depth Estimation Free Multi-sensor Fusion for 3D Occupancy Prediction}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {3587-3604} }
Diffusion-based Multimodal Video Captioning-
[pdf]
[supp]
[bibtex]@InProceedings{Kainulainen_2024_ACCV, author = {Kainulainen, Jaakko and Guo, Zixin and Laaksonen, Jorma}, title = {Diffusion-based Multimodal Video Captioning}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {2820-2837} }
Estimating Soil Organic Carbon from Multispectral Images using Physics-Informed Neural Networks-
[pdf]
[bibtex]@InProceedings{Sargeant_2024_ACCV, author = {Sargeant, James and Teng, Shyh Wei and Murshed, Manzur and Paul, Manoranjan and Brennan, David}, title = {Estimating Soil Organic Carbon from Multispectral Images using Physics-Informed Neural Networks}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {2632-2649} }
RNA: Video Editing with ROI-based Neural Atlas-
[pdf]
[arXiv]
[bibtex]@InProceedings{Lee_2024_ACCV, author = {Lee, Jaekyeong and Kim, Geonung and Cho, Sunghyun}, title = {RNA: Video Editing with ROI-based Neural Atlas}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {1936-1951} }
Masking Cascaded Self-Attentions for Few-Shot Font-Generation Transformer-
[pdf]
[supp]
[bibtex]@InProceedings{Ma_2024_ACCV, author = {Ma, Jing and Xiang, Xiang and He, Yan}, title = {Masking Cascaded Self-Attentions for Few-Shot Font-Generation Transformer}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {2734-2750} }
PixMamba: Leveraging State Space Models in a Dual-Level Architecture for Underwater Image Enhancement-
[pdf]
[arXiv]
[bibtex]@InProceedings{Lin_2024_ACCV, author = {Lin, Wei-Tung and Lin, Yong-Xiang and Chen, Jyun-Wei and Hua, Kai-Lung}, title = {PixMamba: Leveraging State Space Models in a Dual-Level Architecture for Underwater Image Enhancement}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {3622-3637} }
OneBEV: Using One Panoramic Image for Bird's-Eye-View Semantic Mapping-
[pdf]
[bibtex]@InProceedings{Wei_2024_ACCV, author = {Wei, Jiale and Zheng, Junwei and Liu, Ruiping and Hu, Jie and Zhang, Jiaming and Stiefelhagen, Rainer}, title = {OneBEV: Using One Panoramic Image for Bird's-Eye-View Semantic Mapping}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {583-596} }
Seamless-Through-Breaking: Rethinking Image Stitching for Optimal Alignment-
[pdf]
[supp]
[bibtex]@InProceedings{Chen_2024_ACCV, author = {Chen, KuanYan and Garg, Atik and Wang, Yu-Shuen}, title = {Seamless-Through-Breaking: Rethinking Image Stitching for Optimal Alignment}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {4352-4367} }
Spatiotemporal Pooling on Appropriate Topological Maps Represented as Two-Dimensional Images for EEG Classification-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Fukushima_2024_ACCV, author = {Fukushima, Takuto and Miyamoto, Ryusuke}, title = {Spatiotemporal Pooling on Appropriate Topological Maps Represented as Two-Dimensional Images for EEG Classification}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {1401-1419} }
TexDC: Text-Driven Disease-Aware 4D Cardiac Cine MRI Images Generation-
[pdf]
[bibtex]@InProceedings{Liu_2024_ACCV, author = {Liu, Cong and Yuan, Xiaohan and Yu, ZhiPeng and Wang, Yangang}, title = {TexDC: Text-Driven Disease-Aware 4D Cardiac Cine MRI Images Generation}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {3005-3021} }
4DPV: 4D Pet from Videos by Coarse-to-Fine Non-Rigid Radiance Fields-
[pdf]
[arXiv]
[bibtex]@InProceedings{de_Paco_2024_ACCV, author = {de Paco, Sergio M. and Agudo, Antonio}, title = {4DPV: 4D Pet from Videos by Coarse-to-Fine Non-Rigid Radiance Fields}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {2596-2612} }
A computational model for color assimilation illusions and color constancy-
[pdf]
[supp]
[bibtex]@InProceedings{Ulucan_2024_ACCV, author = {Ulucan, Oguzhan and Ulucan, Diclehan and Ebner, Marc}, title = {A computational model for color assimilation illusions and color constancy}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {630-647} }
TaE: Task-aware Expandable Representation for Long Tail Class Incremental Learning-
[pdf]
[arXiv]
[bibtex]@InProceedings{Li_2024_ACCV, author = {Li, Linjie and Wu, Zhenyu and Liu, Jiaming and Ji, Yang}, title = {TaE: Task-aware Expandable Representation for Long Tail Class Incremental Learning}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {3917-3933} }
Feature Generator for Few-Shot Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kanagalingam_2024_ACCV, author = {Kanagalingam, Heethanjan and Pathmanathan, Thenukan and Ketheeswaran, Navaneethan and Vathanakumar, Mokeeshan and Afham, Mohamed and Rodrigo, Ranga}, title = {Feature Generator for Few-Shot Learning}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {3901-3916} }
SeSame: Simple, Easy 3D Object Detection with Point-Wise Semantics-
[pdf]
[arXiv]
[bibtex]@InProceedings{O_2024_ACCV, author = {O, Hayeon and Yang, Chanuk and Huh, Kunsoo}, title = {SeSame: Simple, Easy 3D Object Detection with Point-Wise Semantics}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {2889-2905} }
Act Like a Radiologist: Radiology Report Generation across Anatomical Regions-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chen_2024_ACCV, author = {Chen, Qi and Xie, Yutong and Wu, Biao and Chen, Xiaomin and Ang, James and To, Minh-Son and Chang, Xiaojun and Wu, Qi}, title = {Act Like a Radiologist: Radiology Report Generation across Anatomical Regions}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {1-17} }
PlainUSR: Chasing Faster ConvNet for Efficient Super-Resolution-
[pdf]
[arXiv]
[bibtex]@InProceedings{Wang_2024_ACCV, author = {Wang, Yan and Li, Yusen and Wang, Gang and Liu, Xiaoguang}, title = {PlainUSR: Chasing Faster ConvNet for Efficient Super-Resolution}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {4262-4279} }
VIFA: An Efficient Visible and Infrared Image Fusion Architecture for Multi-task Applications via Continual Learning-
[pdf]
[bibtex]@InProceedings{Shi_2024_ACCV, author = {Shi, Jiaxing and Ren, Ao and Zhuang, Wei and Hua, Yang and Qin, ZhiYong and Wang, Zhenyu and Song, Yang and Tan, Yujuan and Liu, Duo}, title = {VIFA: An Efficient Visible and Infrared Image Fusion Architecture for Multi-task Applications via Continual Learning}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {2872-2888} }
TCL-Net: A Lightweight and Efficient Dehazing Network with Frequency-Domain Fusion and Multi-Angle Attention-
[pdf]
[bibtex]@InProceedings{Tang_2024_ACCV, author = {Tang, Cheng and Lou, Wenqi}, title = {TCL-Net: A Lightweight and Efficient Dehazing Network with Frequency-Domain Fusion and Multi-Angle Attention}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {566-582} }
Blind Super Resolution with Reference Images and Implicit Degradation Representation-
[pdf]
[supp]
[bibtex]@InProceedings{Do_2024_ACCV, author = {Do, Huu-Phu and Hu, Po-Chih and Hsueh, Hao-Chien and Liu, Che-Kai and Tran, Vu-Hoang and Huang, Ching-Chun}, title = {Blind Super Resolution with Reference Images and Implicit Degradation Representation}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {1100-1115} }
DA^2: Degree-Accumulated Data Augmentation on Point Clouds with Curriculum Dynamic Threshold Selection-
[pdf]
[supp]
[bibtex]@InProceedings{Tai_2024_ACCV, author = {Tai, Ta Chun and Do-Tran, Nhat-Tuong and Le, Ngoc-Hoang-Lam and Li, Yung-Hui and Huang, Ching-Chun}, title = {DA{\textasciicircum}2: Degree-Accumulated Data Augmentation on Point Clouds with Curriculum Dynamic Threshold Selection}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {2196-2211} }
FaRE: A Feature-aware Radical Encoding Strategy for Zero-shot Chinese Character Recognition-
[pdf]
[bibtex]@InProceedings{Zhan_2024_ACCV, author = {Zhan, Hongjian and Li, Yangfu and Xiong, Yu-jie and Lu, Yue}, title = {FaRE: A Feature-aware Radical Encoding Strategy for Zero-shot Chinese Character Recognition}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {390-401} }
KEM: SGW-based Multi-Task Learning in Vision Tasks-
[pdf]
[bibtex]@InProceedings{Zhang_2024_ACCV, author = {Zhang, Ruiyuan and Chen, Yuyao and Liu, Jiaxiang and Xi, Dianbing and Huo, Yuchi and Liu, Jie and Wu, Chao}, title = {KEM: SGW-based Multi-Task Learning in Vision Tasks}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {1688-1705} }
It's Just Another Day: Unique Video Captioning by Discriminative Prompting-
[pdf]
[supp]
[bibtex]@InProceedings{Perrett_2024_ACCV, author = {Perrett, Toby and Han, Tengda and Damen, Dima and Zisserman, Andrew}, title = {It's Just Another Day: Unique Video Captioning by Discriminative Prompting}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {232-249} }
Learning Classwise Untangled Continuums for Conditional Normalizing Flows-
[pdf]
[supp]
[bibtex]@InProceedings{Enescu_2024_ACCV, author = {Enescu, Victor and Sahbi, Hichem}, title = {Learning Classwise Untangled Continuums for Conditional Normalizing Flows}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {3038-3055} }
Full-body Human De-lighting with Semi-Supervised Learning-
[pdf]
[bibtex]@InProceedings{Weir_2024_ACCV, author = {Weir, Joshua and Zhao, Junhong and Chalmers, Andrew and Rhee, Taehyun}, title = {Full-body Human De-lighting with Semi-Supervised Learning}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {648-664} }
Parameter-Selective Continual Test-Time Adaptation-
[pdf]
[arXiv]
[bibtex]@InProceedings{Tian_2024_ACCV, author = {Tian, Jiaxu and Lyu, Fan}, title = {Parameter-Selective Continual Test-Time Adaptation}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {1384-1400} }
EDAF: Early Detection of Atrial Fibrillation from Post-Stroke Brain MRI-
[pdf]
[bibtex]@InProceedings{Shokri_2024_ACCV, author = {Shokri, Mohammad Javad and Desai, Nandakishor and Rao, Aravinda S. and Sharobeam, Angelos and Yan, Bernard and Palaniswami, Marimuthu}, title = {EDAF: Early Detection of Atrial Fibrillation from Post-Stroke Brain MRI}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {1969-1985} }
Chinese Character Component Segmentation Based on Character Structure Masks-
[pdf]
[bibtex]@InProceedings{Li_2024_ACCV, author = {Li, Haiyan and Yang, Fang}, title = {Chinese Character Component Segmentation Based on Character Structure Masks}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {1316-1331} }
MeshGS: Adaptive Mesh-Aligned Gaussian Splatting for High-Quality Rendering-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Choi_2024_ACCV, author = {Choi, Jaehoon and Lee, Yonghan and Lee, Hyungtae and Kwon, Heesung and Manocha, Dinesh}, title = {MeshGS: Adaptive Mesh-Aligned Gaussian Splatting for High-Quality Rendering}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {3310-3326} }
Learning Interval-Aware Embedding for Macro- and Micro-expression Spotting-
[pdf]
[bibtex]@InProceedings{Li_2024_ACCV, author = {Li, Xiaodong and Li, Jiajun and Du, Wenchao and Chen, Hu and Yang, Hongyu}, title = {Learning Interval-Aware Embedding for Macro- and Micro-expression Spotting}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {337-353} }
Learning Complementary Maps for Light Field Salient Object Detection-
[pdf]
[supp]
[bibtex]@InProceedings{Xiao_2024_ACCV, author = {Xiao, Zeyu and Shou, Jiateng and Xiong, Zhiwei}, title = {Learning Complementary Maps for Light Field Salient Object Detection}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {4403-4421} }
MS-UMLP: Medical Image Segmentation via Multi-Scale U-shape MLP-Mixer-
[pdf]
[bibtex]@InProceedings{Xie_2024_ACCV, author = {Xie, Bin and Tang, Hao and Cai, Dawen and Yan, Yan}, title = {MS-UMLP: Medical Image Segmentation via Multi-Scale U-shape MLP-Mixer}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {1793-1808} }
A StyleCLIP-based Facial Emotion Manipulation Method for Discrepant Emotion Transitions-
[pdf]
[bibtex]@InProceedings{Guo_2024_ACCV, author = {Guo, Qi and Gu, Xiaodong}, title = {A StyleCLIP-based Facial Emotion Manipulation Method for Discrepant Emotion Transitions}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {3414-3431} }
Few Exemplar-Based General Medical Image Segmentation via Domain-Aware Selective Adaptation-
[pdf]
[arXiv]
[bibtex]@InProceedings{Xu_2024_ACCV, author = {Xu, Chen and Huang, Qiming and Hou, Yuqi and Wu, Jiangxing and Zhang, Fan and Chang, Hyung Jin and Jiao, Jianbo}, title = {Few Exemplar-Based General Medical Image Segmentation via Domain-Aware Selective Adaptation}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {2684-2698} }
Tracking Reflected Objects: A Benchmark-
[pdf]
[arXiv]
[bibtex]@InProceedings{Guo_2024_ACCV, author = {Guo, Xiaoyu and Zhong, Pengzhi and Lin, Lizhi and Zhang, Hao and Huang, Ling and Li, Shuiwang}, title = {Tracking Reflected Objects: A Benchmark}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {1756-1776} }
CrossPAR: Enhancing Pedestrian Attribute Recognition with Vision-Language Fusion and Human-Centric Pre-training-
[pdf]
[bibtex]@InProceedings{Ngo_2024_ACCV, author = {Ngo, Bach-Hoang and Ngo, Si-Tri and Le, Phu-Duc and Phan, Quang-Minh and Tran, Minh-Triet and Le, Trung-Nghia}, title = {CrossPAR: Enhancing Pedestrian Attribute Recognition with Vision-Language Fusion and Human-Centric Pre-training}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {1301-1315} }
GSMNet: Towards Long-term Trajectory Prediction by Integrating Multi-Scale Information-
[pdf]
[bibtex]@InProceedings{Liu_2024_ACCV, author = {Liu, Shaohua and Wang, Yisu and Zhu, Yinglong and Yao, Pengfei and Mao, Tianlu and Wang, Zhaoqi}, title = {GSMNet: Towards Long-term Trajectory Prediction by Integrating Multi-Scale Information}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {2954-2969} }
Structure-Centric Robust Monocular Depth Estimation via Knowledge Distillation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chen_2024_ACCV, author = {Chen, Runze and Luo, Haiyong and Zhao, Fang and Yu, Jingze and Jia, Yupeng and Wang, Juan and Ma, Xuepeng}, title = {Structure-Centric Robust Monocular Depth Estimation via Knowledge Distillation}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {2970-2987} }
High-Quality Visually-Guided Sound Separation from Diverse Categories-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Huang_2024_ACCV, author = {Huang, Chao and Liang, Susan and Tian, Yapeng and Kumar, Anurag and Xu, Chenliang}, title = {High-Quality Visually-Guided Sound Separation from Diverse Categories}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {35-49} }
FSGait: Fine Grained Self-Supervised Gait Abnormality Detection-
[pdf]
[bibtex]@InProceedings{Duan_2024_ACCV, author = {Duan, Bingzhi and Wan, Xiaoyue and Zhao, Xu}, title = {FSGait: Fine Grained Self-Supervised Gait Abnormality Detection}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {2248-2264} }
Spotlight on Small-scale Ship Detection: Empowering YOLO with Advanced Techniques and a Novel Dataset-
[pdf]
[supp]
[bibtex]@InProceedings{Li_2024_ACCV, author = {Li, Lingya and Hou, Zhixing and Ma, Ming and Xiang, Jing and Yuan, Chuangxin and Xia, Guihua}, title = {Spotlight on Small-scale Ship Detection: Empowering YOLO with Advanced Techniques and a Novel Dataset}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {784-799} }
Foundation Model-Powered 3D Few-Shot Class Incremental Learning via Training-free Adaptor-
[pdf]
[arXiv]
[bibtex]@InProceedings{Ahmadi_2024_ACCV, author = {Ahmadi, Sahar and Cheraghian, Ali and Saberi, Morteza and Abir, Md. Towsif and Dastmalchi, Hamidreza and Hussain, Farookh and Rahman, Shafin}, title = {Foundation Model-Powered 3D Few-Shot Class Incremental Learning via Training-free Adaptor}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {2282-2299} }
Calibration Transfer via Knowledge Distillation-
[pdf]
[supp]
[bibtex]@InProceedings{Hebbalaguppe_2024_ACCV, author = {Hebbalaguppe, Ramya and Baranwal, Mayank and Anand, Kartik and Arora, Chetan}, title = {Calibration Transfer via Knowledge Distillation}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {513-530} }
TuneVLSeg: Prompt Tuning Benchmark for Vision-Language Segmentation Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Adhikari_2024_ACCV, author = {Adhikari, Rabin and Thapaliya, Safal and Dhakal, Manish and Khanal, Bishesh}, title = {TuneVLSeg: Prompt Tuning Benchmark for Vision-Language Segmentation Models}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {126-144} }
DENEB: A Hallucination-Robust Automatic Evaluation Metric for Image Captioning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Matsuda_2024_ACCV, author = {Matsuda, Kazuki and Wada, Yuiga and Sugiura, Komei}, title = {DENEB: A Hallucination-Robust Automatic Evaluation Metric for Image Captioning}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {3570-3586} }
EgoCoord: Self-calibrated Egocentric 3D Body Pose Estimation using Pixel-wise Coordinate Encoding-
[pdf]
[bibtex]@InProceedings{Lee_2024_ACCV, author = {Lee, Jong-Bae and Lee, Hyoung and Lee, Beom-Ryeol and Lee, Byung-Gook and Son, Wook-Ho}, title = {EgoCoord: Self-calibrated Egocentric 3D Body Pose Estimation using Pixel-wise Coordinate Encoding}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {1233-1249} }
Match-free Inbetweening Assistant (MIBA): A Practical Animation Tool without User Stroke Correspondence-
[pdf]
[bibtex]@InProceedings{Chen_2024_ACCV, author = {Chen, Shuhong and Zwicker, Matthias}, title = {Match-free Inbetweening Assistant (MIBA): A Practical Animation Tool without User Stroke Correspondence}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {179-193} }
LCM: Log Conformal Maps for Robust Representation Learning to Mitigate Perspective Distortion-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chippa_2024_ACCV, author = {Chippa, Meenakshi Subhash and Chhipa, Prakash Chandra and De, Kanjar and Liwicki, Marcus and Saini, Rajkumar}, title = {LCM: Log Conformal Maps for Robust Representation Learning to Mitigate Perspective Distortion}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {3275-3291} }
Reference-Based Face Super-Resolution Using the Spatial Transformer-
[pdf]
[bibtex]@InProceedings{Jois_2024_ACCV, author = {Jois, Varun Ramesh and DiLillo, Antonella and Storer, James}, title = {Reference-Based Face Super-Resolution Using the Spatial Transformer}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {3689-3705} }
Tracking Correction Method for Rapid and Random Protein Molecules Movement-
[pdf]
[bibtex]@InProceedings{Kamiya_2024_ACCV, author = {Kamiya, Satoshi and Toida, Keisuke and Tsunoyama, Taka-aki and Hotta, Kazuhiro}, title = {Tracking Correction Method for Rapid and Random Protein Molecules Movement}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {3022-3037} }
PSG-Adapter: Controllable Planning Scene Graph for Improving Text-to-Image Diffusion-
[pdf]
[supp]
[bibtex]@InProceedings{Gao_2024_ACCV, author = {Gao, Yi}, title = {PSG-Adapter: Controllable Planning Scene Graph for Improving Text-to-Image Diffusion}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {2371-2387} }
BoT-FaceSORT: Bag-of-Tricks for Robust Multi-Face Tracking in Unconstrained Videos-
[pdf]
[supp]
[bibtex]@InProceedings{Kim_2024_ACCV, author = {Kim, Jonghyeon and Ju, Chan-Yang and Kim, Gun-Woo and Lee, Dong-Ho}, title = {BoT-FaceSORT: Bag-of-Tricks for Robust Multi-Face Tracking in Unconstrained Videos}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {1437-1453} }
ADSP: Advanced Dataset for Shadow Processing, enabling visible occluders via synthesizing strategy.-
[pdf]
[supp]
[bibtex]@InProceedings{Hsieh_2024_ACCV, author = {Hsieh, Chang-Yu and Ding, Jian-Jiun}, title = {ADSP: Advanced Dataset for Shadow Processing, enabling visible occluders via synthesizing strategy.}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {1028-1045} }
ObjectCompose: Evaluating Resilience of Vision-Based Models on Object-to-Background Compositional Changes-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Malik_2024_ACCV, author = {Malik, Hashmat Shadab and Huzaifa, Muhammad and Naseer, Muzammal and Khan, Salman and Khan, Fahad Shahbaz}, title = {ObjectCompose: Evaluating Resilience of Vision-Based Models on Object-to-Background Compositional Changes}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {372-389} }
Feature Estimation of Global Language Processing in EEG Using Attention Maps-
[pdf]
[arXiv]
[bibtex]@InProceedings{Shimizu_2024_ACCV, author = {Shimizu, Dai and Watanabe, Ko and Dengel, Andreas}, title = {Feature Estimation of Global Language Processing in EEG Using Attention Maps}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {1706-1722} }
Efficient Implicit SDF and Color Reconstruction via Shared Feature Field-
[pdf]
[bibtex]@InProceedings{Fang_2024_ACCV, author = {Fang, Shuangkang and Qi, Dacheng and Xu, Weixin and Wang, Yufeng and Zhang, Zehao and Zhang, Xiaorong and Zhang, Huayu and Shao, Zeqi and Ding, Wenrui}, title = {Efficient Implicit SDF and Color Reconstruction via Shared Feature Field}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {3499-3516} }
BAMG: Text-based Person Re-identification via Bottlenecks Attention and Masked Graph Modeling-
[pdf]
[bibtex]@InProceedings{Cheng_2024_ACCV, author = {Cheng, Keyang and Zou, Wenxuan and Gu, Hongjian and Ouyang, Anxiang}, title = {BAMG: Text-based Person Re-identification via Bottlenecks Attention and Masked Graph Modeling}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {1809-1826} }
Nash Meets Wertheimer: Using Good Continuation in Jigsaw Puzzles-
[pdf]
[arXiv]
[bibtex]@InProceedings{Khoroshiltseva_2024_ACCV, author = {Khoroshiltseva, Marina and Palmieri, Luca and Aslan, Sinem and Vascon, Sebastiano and Pelillo, Marcello}, title = {Nash Meets Wertheimer: Using Good Continuation in Jigsaw Puzzles}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {3223-3238} }
A Simple Finetuning Strategy Based on Bias-Variance Ratios of Layer-Wise Gradients-
[pdf]
[bibtex]@InProceedings{Tomita_2024_ACCV, author = {Tomita, Mao and Sato, Ikuro and Kawakami, Rei and Inoue, Nakamasa and Ikehata, Satoshi and Tanaka, Masayuki}, title = {A Simple Finetuning Strategy Based on Bias-Variance Ratios of Layer-Wise Gradients}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {471-487} }
Adapting Models to Scarce Target Data without Source Samples-
[pdf]
[supp]
[bibtex]@InProceedings{Lee_2024_ACCV, author = {Lee, JoonHo and Lee, Gyemin}, title = {Adapting Models to Scarce Target Data without Source Samples}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {1618-1633} }
SSTHyper: Sparse Spectral Transformer for Hyperspectral Image Reconstruction-
[pdf]
[bibtex]@InProceedings{Xu_2024_ACCV, author = {Xu, Meng and Lin, Mingying and Ren, Qi and Jia, Sen}, title = {SSTHyper: Sparse Spectral Transformer for Hyperspectral Image Reconstruction}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {1918-1935} }
Conditional Distribution Modelling for Few-Shot Image Synthesis with Diffusion Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Gupta_2024_ACCV, author = {Gupta, Parul and Hayat, Munawar and Dhall, Abhinav and Do, Thanh-Toan}, title = {Conditional Distribution Modelling for Few-Shot Image Synthesis with Diffusion Models}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {818-834} }
The Devil is in the Details: Simple Remedies for Image-to-LiDAR Representation Learning-
[pdf]
[supp]
[bibtex]@InProceedings{Jo_2024_ACCV, author = {Jo, Wonjun and Byung-Ki, Kwon and Ji-Yeon, Kim and Jeong, Hawook and Joo, Kyungdon and Oh, Tae-Hyun}, title = {The Devil is in the Details: Simple Remedies for Image-to-LiDAR Representation Learning}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {3172-3188} }
SCCA-Net: A Novel Network for Image Manipulation Localization Using Split-Channel Contextual Attention-
[pdf]
[bibtex]@InProceedings{Xiang_2024_ACCV, author = {Xiang, Yan and Zhao, Kaiqi and Yin, Haichang}, title = {SCCA-Net: A Novel Network for Image Manipulation Localization Using Split-Channel Contextual Attention}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {4473-4487} }
Revealing Hidden Context in Camouflage Instance Segmentation-
[pdf]
[supp]
[bibtex]@InProceedings{Phung_2024_ACCV, author = {Phung, Thanh-Hai and Shuai, Hong-Han}, title = {Revealing Hidden Context in Camouflage Instance Segmentation}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {2319-2336} }
Dessie: Disentanglement for Articulated 3D Horse Shape and Pose Estimation from Images-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Li_2024_ACCV, author = {Li, Ci and Yang, Yi and Weng, Zehang and Hernlund, Elin and Zuffi, Silvia and Kjellstr\"om, Hedvig}, title = {Dessie: Disentanglement for Articulated 3D Horse Shape and Pose Estimation from Images}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {764-783} }
Greit-HRNet: Grouped Lightweight High-Resolution Network for Human Pose Estimation-
[pdf]
[bibtex]@InProceedings{Han_2024_ACCV, author = {Han, Junjia and Wang, Yanxia}, title = {Greit-HRNet: Grouped Lightweight High-Resolution Network for Human Pose Estimation}, booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)}, month = {December}, year = {2024}, pages = {3771-3787} }
Improve Model Robustness in Less Time Than It Takes to Drink A Cup of Coffee with Plug-and-Play Plugins.-
[pdf]
[bibtex]@InProceedings{Fang_2024_ACCV,
  author    = {Fang, Jiang and Zhang, Zhicheng and Sun, Jiyan and Fu, Jiadong and He, Haonan and Liu, Yinlong and Ma, Wei},
  title     = {Improve Model Robustness in Less Time Than It Takes to Drink A Cup of Coffee with Plug-and-Play Plugins.},
  booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)},
  month     = dec,
  year      = {2024},
  pages     = {1520--1531},
}
Locate n' Rotate: Two-stage Openable Part Detection with Geometric Foundation Model Priors-
[pdf]
[bibtex]@InProceedings{Li_2024_ACCV,
  author    = {Li, Siqi and Chen, Xiaoxue and Cheng, Haoyu and Zhou, Guyue and Zhao, Hao and Tian, Guanzhong},
  title     = {Locate n' Rotate: Two-stage Openable Part Detection with Geometric Foundation Model Priors},
  booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)},
  month     = dec,
  year      = {2024},
  pages     = {716--732},
}
Character-aware audio-visual subtitling in context-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Huh_2024_ACCV,
  author    = {Huh, Jaesung and Zisserman, Andrew},
  title     = {Character-aware audio-visual subtitling in context},
  booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)},
  month     = dec,
  year      = {2024},
  pages     = {2613--2631},
}
A Generic Autoregressive Predictive Feedback Framework for Skeleton-Based Action Recognition-
[pdf]
[bibtex]@InProceedings{Yin_2024_ACCV,
  author    = {Yin, Xinpeng and Hu, Jing and Cao, Wenming},
  title     = {A Generic Autoregressive Predictive Feedback Framework for Skeleton-Based Action Recognition},
  booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)},
  month     = dec,
  year      = {2024},
  pages     = {3465--3479},
}
Exploring Limits of Diffusion-Synthetic Training with Weakly Supervised Semantic Segmentation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yoshihashi_2024_ACCV,
  author    = {Yoshihashi, Ryota and Otsuka, Yuya and Doi, Kenji and Tanaka, Tomohiro and Kataoka, Hirokatsu},
  title     = {Exploring Limits of Diffusion-Synthetic Training with Weakly Supervised Semantic Segmentation},
  booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)},
  month     = dec,
  year      = {2024},
  pages     = {2300--2318},
}
ESM-YOLO: Enhanced Small Target Detection Based on Visible and Infrared Multi-modal Fusion-
[pdf]
[bibtex]@InProceedings{Zhang_2024_ACCV,
  author    = {Zhang, Qianqian and Qiu, Linwei and Zhou, Li and An, Junshe},
  title     = {{ESM-YOLO}: Enhanced Small Target Detection Based on Visible and Infrared Multi-modal Fusion},
  booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)},
  month     = dec,
  year      = {2024},
  pages     = {1454--1469},
}
Diffusing Background Dictionary for Hyperspectral Anomaly Detection-
[pdf]
[bibtex]@InProceedings{Wu_2024_ACCV,
  author    = {Wu, Yaochen and Meng, Yu and Sun, Lei},
  title     = {Diffusing Background Dictionary for Hyperspectral Anomaly Detection},
  booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)},
  month     = dec,
  year      = {2024},
  pages     = {1046--1064},
}
Robust Single-view 3D Human Digitization via Explicit Geometric Field with Semantic Guidance-
[pdf]
[bibtex]@InProceedings{Liu_2024_ACCV,
  author    = {Liu, Ruizhi and Remagnino, Paolo},
  title     = {Robust Single-view {3D} Human Digitization via Explicit Geometric Field with Semantic Guidance},
  booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)},
  month     = dec,
  year      = {2024},
  pages     = {3362--3378},
}
Learning Dual Hierarchical Representation for 3D Surface Reconstruction-
[pdf]
[supp]
[bibtex]@InProceedings{Shin_2024_ACCV,
  author    = {Shin, Jiyoon and Kim, Youngwook and Hong, Sangwoo and Lee, Jungwoo},
  title     = {Learning Dual Hierarchical Representation for {3D} Surface Reconstruction},
  booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)},
  month     = dec,
  year      = {2024},
  pages     = {4422--4438},
}
Joint Image Super-resolution and Low-light Enhancement in the Dark-
[pdf]
[supp]
[bibtex]@InProceedings{Zhou_2024_ACCV,
  author    = {Zhou, Feihu and Chang, Kan and Ling, Mingyang and Li, Hengxin and Xia, Shucheng},
  title     = {Joint Image Super-resolution and Low-light Enhancement in the Dark},
  booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)},
  month     = dec,
  year      = {2024},
  pages     = {1332--1349},
}
Beyond Coarse-Grained Matching in Video-Text Retrieval-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Chen_2024_ACCV,
  author    = {Chen, Aozhu and Doughty, Hazel and Li, Xirong and Snoek, Cees G. M.},
  title     = {Beyond Coarse-Grained Matching in Video-Text Retrieval},
  booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)},
  month     = dec,
  year      = {2024},
  pages     = {71--87},
}
UNet--: Memory-Efficient and Feature-Enhanced Network Architecture based on U-Net with Reduced Skip-Connections-
[pdf]
[bibtex]@InProceedings{Yin_2024_ACCV,
  author    = {Yin, Lingxiao and Tao, Wei and Zhao, Dongyue and Ito, Tadayuki and Osa, Kinya and Kato, Masami and Chen, Tse-Wei},
  title     = {{UNet-{}-}: Memory-Efficient and Feature-Enhanced Network Architecture based on {U-Net} with Reduced Skip-Connections},
  booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)},
  month     = dec,
  year      = {2024},
  pages     = {4085--4099},
}
Enhancing Multimedia Applications by Removing Dynamic Objects in Neural Radiance Fields-
[pdf]
[bibtex]@InProceedings{Yang_2024_ACCV,
  author    = {Yang, XianBen and Wang, Tao and Liu, He and Jin, Yi and Lang, Congyan and Li, Yidong},
  title     = {Enhancing Multimedia Applications by Removing Dynamic Objects in Neural Radiance Fields},
  booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)},
  month     = dec,
  year      = {2024},
  pages     = {2070--2086},
}
Revisiting sample weights based method for noisy-label detection and classification-
[pdf]
[bibtex]@InProceedings{Hoang_2024_ACCV,
  author    = {Hoang, Tuan and Tran, Hung and Rana, Santu and Gupta, Sunil and Venkatesh, Svetha},
  title     = {Revisiting sample weights based method for noisy-label detection and classification},
  booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)},
  month     = dec,
  year      = {2024},
  pages     = {4189--4204},
}
Enhancing Robustness to Noise Corruption for Point Cloud Recognition via Spatial Sorting and Set-Mixing Aggregation Module-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhang_2024_ACCV,
  author    = {Zhang, Dingxin and Yu, Jianhui and Xue, Tengfei and Zhang, Chaoyi and Liu, Dongnan and Cai, Weidong},
  title     = {Enhancing Robustness to Noise Corruption for Point Cloud Recognition via Spatial Sorting and Set-Mixing Aggregation Module},
  booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)},
  month     = dec,
  year      = {2024},
  pages     = {4205--4222},
}
Hybrid and Non-minimal Planar Motion Estimation from Point Correspondences-
[pdf]
[supp]
[bibtex]@InProceedings{Simental_2024_ACCV,
  author    = {Simental, Juan Carlos Dibene and Dunn, Enrique},
  title     = {Hybrid and Non-minimal Planar Motion Estimation from Point Correspondences},
  booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)},
  month     = dec,
  year      = {2024},
  pages     = {4561--4576},
}
Text Query to Web Image to Video: A Comprehensive Ad-hoc Video Search-
[pdf]
[supp]
[bibtex]@InProceedings{Nguyen_2024_ACCV,
  author    = {Nguyen, Nhat-Minh and Mai, Tien-Dung and Le, Duy-Dinh},
  title     = {Text Query to Web Image to Video: A Comprehensive Ad-hoc Video Search},
  booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)},
  month     = dec,
  year      = {2024},
  pages     = {4141--4155},
}
GeoRefineNet: A Multistage Framework for Enhanced Cephalometric Landmark Detection in CBCT Images Using 3D Geometric Information-
[pdf]
[bibtex]@InProceedings{Viriyasaranon_2024_ACCV,
  author    = {Viriyasaranon, Thanaporn and Ma, Serie and Choi, Jang-Hwan},
  title     = {{GeoRefineNet}: A Multistage Framework for Enhanced Cephalometric Landmark Detection in {CBCT} Images Using {3D} Geometric Information},
  booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)},
  month     = dec,
  year      = {2024},
  pages     = {3107--3119},
}
AutoAD-Zero: A Training-Free Framework for Zero-Shot Audio Description-
[pdf]
[bibtex]@InProceedings{Xie_2024_ACCV,
  author    = {Xie, Junyu and Han, Tengda and Bain, Max and Nagrani, Arsha and Varol, G{\"u}l and Xie, Weidi and Zisserman, Andrew},
  title     = {{AutoAD-Zero}: A Training-Free Framework for Zero-Shot Audio Description},
  booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)},
  month     = dec,
  year      = {2024},
  pages     = {2265--2281},
}
LocoMotion: Learning Motion-Focused Video-Language Representations-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Doughty_2024_ACCV,
  author    = {Doughty, Hazel and Thoker, Fida Mohammad and Snoek, Cees G. M.},
  title     = {{LocoMotion}: Learning Motion-Focused Video-Language Representations},
  booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)},
  month     = dec,
  year      = {2024},
  pages     = {50--70},
}
D'OH: Decoder-Only Random Hypernetworks for Implicit Neural Representations-
[pdf]
[supp]
[bibtex]@InProceedings{Gordon_2024_ACCV,
  author    = {Gordon, Cameron and MacDonald, Lachlan E. and Saratchandran, Hemanth and Lucey, Simon},
  title     = {{D'OH}: Decoder-Only Random Hypernetworks for Implicit Neural Representations},
  booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)},
  month     = dec,
  year      = {2024},
  pages     = {2507--2526},
}
Cross Feature Fusion of Fundus Image and Generated Lesion Map for Referable Diabetic Retinopathy Classification-
[pdf]
[arXiv]
[bibtex]@InProceedings{Mok_2024_ACCV,
  author    = {Mok, Dahyun and Bum, Junghyun and Tai, Le Duc and Choo, Hyunseung},
  title     = {Cross Feature Fusion of Fundus Image and Generated Lesion Map for Referable Diabetic Retinopathy Classification},
  booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)},
  month     = dec,
  year      = {2024},
  pages     = {1350--1365},
}
Randomized Channel-pass Mask for Channel-wise Explanation of Black-box Models-
[pdf]
[bibtex]@InProceedings{Hachiya_2024_ACCV,
  author    = {Hachiya, Hirotaka and Nisawa, Daiki},
  title     = {Randomized Channel-pass Mask for Channel-wise Explanation of Black-box Models},
  booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)},
  month     = dec,
  year      = {2024},
  pages     = {3756--3770},
}
DPL: Cross-quality DeepFake Detection via Dual Progressive Learning-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhang_2024_ACCV,
  author    = {Zhang, Dongliang and Li, Yunfei and Zhou, Jiaran and Li, Yuezun},
  title     = {{DPL}: Cross-quality {DeepFake} Detection via Dual Progressive Learning},
  booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)},
  month     = dec,
  year      = {2024},
  pages     = {1116--1132},
}
Diffusion Model Compression for Image-to-Image Translation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kim_2024_ACCV,
  author    = {Kim, Geonung and Kim, Beomsu and Park, Eunhyeok and Cho, Sunghyun},
  title     = {Diffusion Model Compression for Image-to-Image Translation},
  booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)},
  month     = dec,
  year      = {2024},
  pages     = {2105--2123},
}
Contrastive Max-correlation for Multi-view Clustering-
[pdf]
[bibtex]@InProceedings{Deng_2024_ACCV,
  author    = {Deng, Yanghao and Wang, Zenghui and Du, Songlin},
  title     = {Contrastive Max-correlation for Multi-view Clustering},
  booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)},
  month     = dec,
  year      = {2024},
  pages     = {499--512},
}
Robust Visual Reinforcement Learning by Prompt Tuning-
[pdf]
[supp]
[bibtex]@InProceedings{Tran_2024_ACCV,
  author    = {Tran, Tung and Than, Khoat and Vargas, Danilo},
  title     = {Robust Visual Reinforcement Learning by Prompt Tuning},
  booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)},
  month     = dec,
  year      = {2024},
  pages     = {1133--1147},
}
LoLI-Street: Benchmarking Low-light Image Enhancement and Beyond-
[pdf]
[supp]
[bibtex]@InProceedings{Islam_2024_ACCV,
  author    = {Islam, Md Tanvir and Alam, Inzamamul and Woo, Simon S. and Anwar, Saeed and Lee, IK Hyun and Muhammad, Khan},
  title     = {{LoLI-Street}: Benchmarking Low-light Image Enhancement and Beyond},
  booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)},
  month     = dec,
  year      = {2024},
  pages     = {1250--1267},
}
Fine-tuning Large Language Models for Automatic Font Skeleton Generation: Exploration and Analysis-
[pdf]
[bibtex]@InProceedings{Liu_2024_ACCV,
  author    = {Liu, Yuxuan and Fujii, Yasuhisa and Zhu, Xinru and Nohara, Kayoko},
  title     = {Fine-tuning Large Language Models for Automatic Font Skeleton Generation: Exploration and Analysis},
  booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)},
  month     = dec,
  year      = {2024},
  pages     = {4156--4171},
}
Pluggable Style Representation Learning for Multi-Style Transfer-
[pdf]
[supp]
[bibtex]@InProceedings{Liu_2024_ACCV,
  author    = {Liu, Hongda and Wang, Longguang and Guan, Weijun and Zhang, Ye and Guo, Yulan},
  title     = {Pluggable Style Representation Learning for Multi-Style Transfer},
  booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)},
  month     = dec,
  year      = {2024},
  pages     = {2087--2104},
}
CNN Mixture-of-Depths-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Cakaj_2024_ACCV,
  author    = {Cakaj, Rinor and Mehnert, Jens and Yang, Bin},
  title     = {{CNN} Mixture-of-Depths},
  booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)},
  month     = dec,
  year      = {2024},
  pages     = {3480--3498},
}
Optimized Breast Lesion Segmentation in Ultrasound Videos Across Varied Resource-Scant Environments-
[pdf]
[bibtex]@InProceedings{Li_2024_ACCV,
  author    = {Li, Yunhao and Chen, Zibin and Yan, Junming and Ding, Ziyu and Li, Jie and Huang, Teng and Pei, Xiaoqing and Zhang, Zheng and Wang, Qiong and Pang, Yan},
  title     = {Optimized Breast Lesion Segmentation in Ultrasound Videos Across Varied Resource-Scant Environments},
  booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)},
  month     = dec,
  year      = {2024},
  pages     = {4318--4333},
}
Wavelet-based Mamba with Fourier Adjustment for Low-light Image Enhancement-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Tan_2024_ACCV,
  author    = {Tan, Junhao and Pei, Songwen and Qin, Wei and Fu, Bo and Li, Ximing and Huang, Libo},
  title     = {Wavelet-based {Mamba} with {Fourier} Adjustment for Low-light Image Enhancement},
  booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)},
  month     = dec,
  year      = {2024},
  pages     = {3449--3464},
}
Spectral Modality-Aware Interactive Fusion Network for HSI Super-Resolution-
[pdf]
[bibtex]@InProceedings{Xu_2024_ACCV,
  author    = {Xu, Meng and Mao, Jiayou and Mo, Ziqian and Fu, Xiyou and Jia, Sen},
  title     = {Spectral Modality-Aware Interactive Fusion Network for {HSI} Super-Resolution},
  booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)},
  month     = dec,
  year      = {2024},
  pages     = {4544--4560},
}
MonoDSSMs: Efficient Monocular 3D Object Detection with Depth-Aware State Space Models-
[pdf]
[bibtex]@InProceedings{Vu_2024_ACCV,
  author    = {Vu, Kiet Dang and Tran, Trung Thai and Nguyen, Duc Dung},
  title     = {{MonoDSSMs}: Efficient Monocular {3D} Object Detection with Depth-Aware State Space Models},
  booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)},
  month     = dec,
  year      = {2024},
  pages     = {3883--3900},
}
BootsTAP: Bootstrapped Training for Tracking-Any-Point-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Doersch_2024_ACCV,
  author    = {Doersch, Carl and Luc, Pauline and Yang, Yi and Gokay, Dilara and Koppula, Skanda and Gupta, Ankush and Heyward, Joseph and Rocco, Ignacio and Goroshin, Ross and Carreira, Jo{\~a}o and Zisserman, Andrew},
  title     = {{BootsTAP}: Bootstrapped Training for Tracking-Any-Point},
  booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)},
  month     = dec,
  year      = {2024},
  pages     = {3257--3274},
}
Match me if you can: Semi-Supervised Semantic Correspondence Learning with Unpaired Images-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kim_2024_ACCV,
  author    = {Kim, Jiwon and Heo, Byeongho and Yun, Sangdoo and Kim, Seungryong and Han, Dongyoon},
  title     = {Match me if you can: Semi-Supervised Semantic Correspondence Learning with Unpaired Images},
  booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)},
  month     = dec,
  year      = {2024},
  pages     = {3154--3171},
}
HMGS: Hybrid Model of Gaussian Splatting for Enhancing 3D Reconstruction with Reflections-
[pdf]
[bibtex]@InProceedings{Zhang_2024_ACCV,
  author    = {Zhang, Hengbin and Wang, Chengliang and Liu, Ji and Jiang, Tian and Luo, Yonggang and Xie, Lecheng},
  title     = {{HMGS}: Hybrid Model of {Gaussian} Splatting for Enhancing {3D} Reconstruction with Reflections},
  booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)},
  month     = dec,
  year      = {2024},
  pages     = {3819--3835},
}
Do they Share the Same Tail? Learning Individual Compositional Attribute Prototype for Generalized Zero-Shot Learning-
[pdf]
[bibtex]@InProceedings{Shi_2024_ACCV,
  author    = {Shi, Yuyan and Jiang, Chenyi and Shi, Run and Zhang, Haofeng},
  title     = {Do they Share the Same Tail? Learning Individual Compositional Attribute Prototype for Generalized Zero-Shot Learning},
  booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)},
  month     = dec,
  year      = {2024},
  pages     = {4595--4611},
}
Multiview Detection with Cardboard Human Modeling-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Ma_2024_ACCV,
  author    = {Ma, Jiahao and Duan, Zicheng and Zheng, Liang and Nguyen, Chuong},
  title     = {Multiview Detection with Cardboard Human Modeling},
  booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)},
  month     = dec,
  year      = {2024},
  pages     = {870--886},
}
Class-Aware Contrastive Learning for Fine-Grained Skeleton-Based Action Recognition-
[pdf]
[bibtex]@InProceedings{Bian_2024_ACCV,
  author    = {Bian, Xinyu and Chang, Dongliang and Yang, Yuqi and He, Zhongjiang and Liang, Kongming and Ma, Zhanyu},
  title     = {Class-Aware Contrastive Learning for Fine-Grained Skeleton-Based Action Recognition},
  booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)},
  month     = dec,
  year      = {2024},
  pages     = {3638--3654},
}
HAHA: Highly Articulated Gaussian Human Avatars with Textured Mesh Prior-
[pdf]
[arXiv]
[bibtex]@InProceedings{Svitov_2024_ACCV,
  author    = {Svitov, David and Morerio, Pietro and Agapito, Lourdes and Del Bue, Alessio},
  title     = {{HAHA}: Highly Articulated {Gaussian} Human Avatars with Textured Mesh Prior},
  booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)},
  month     = dec,
  year      = {2024},
  pages     = {4051--4068},
}
Moving Object Segmentation: All You Need Is SAM (and Flow)-
[pdf]
[arXiv]
[bibtex]@InProceedings{Xie_2024_ACCV,
  author    = {Xie, Junyu and Yang, Charig and Xie, Weidi and Zisserman, Andrew},
  title     = {Moving Object Segmentation: All You Need Is {SAM} (and Flow)},
  booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)},
  month     = dec,
  year      = {2024},
  pages     = {162--178},
}
EQ-CBM: A Probabilistic Concept Bottleneck with Energy-based Models and Quantized Vectors-
[pdf]
[bibtex]@InProceedings{Kim_2024_ACCV,
  author    = {Kim, Sangwon and Ahn, Dasom and Ko, Byoung Chul and Jang, In-su and Kim, Kwang-Ju},
  title     = {{EQ-CBM}: A Probabilistic Concept Bottleneck with Energy-based Models and Quantized Vectors},
  booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)},
  month     = dec,
  year      = {2024},
  pages     = {3432--3448},
}
SpikeGS: Learning 3D Gaussian Fields from Continuous Spike Stream-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yu_2024_ACCV,
  author    = {Yu, Jinze and Peng, Xin and Lu, Zhengda and Kneip, Laurent and Wang, Yiqun},
  title     = {{SpikeGS}: Learning {3D} {Gaussian} Fields from Continuous Spike Stream},
  booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)},
  month     = dec,
  year      = {2024},
  pages     = {4280--4298},
}
M-RAT: a Multi-grained Retrieval Augmentation Transformer for Image Captioning-
[pdf]
[bibtex]@InProceedings{Song_2024_ACCV,
  author    = {Song, Jiayan and Pan, Renjie and Zhou, Jun and Yang, Hua},
  title     = {{M-RAT}: a Multi-grained Retrieval Augmentation Transformer for Image Captioning},
  booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)},
  month     = dec,
  year      = {2024},
  pages     = {3865--3882},
}
Cross-Modality Complementary Learning for Video-based Cloth-Changing Person Re-Identification-
[pdf]
[supp]
[bibtex]@InProceedings{Nguyen_2024_ACCV,
  author    = {Nguyen, Vuong D. and Mantini, Pranav and Shah, Shishir K.},
  title     = {Cross-Modality Complementary Learning for Video-based Cloth-Changing Person Re-Identification},
  booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)},
  month     = dec,
  year      = {2024},
  pages     = {88--107},
}
ULTRON: Unifying Local Transformer and Convolution for Large-scale Image Retrieval-
[pdf]
[supp]
[bibtex]@InProceedings{Kweon_2024_ACCV,
  author    = {Kweon, Minseong and Park, Jinsun},
  title     = {{ULTRON}: Unifying Local Transformer and Convolution for Large-scale Image Retrieval},
  booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)},
  month     = dec,
  year      = {2024},
  pages     = {4000--4016},
}
KhmerST: A Low-Resource Khmer Scene Text Detection and Recognition Benchmark-
[pdf]
[arXiv]
[bibtex]@InProceedings{Nom_2024_ACCV,
  author    = {Nom, Vannkinh and Bakkali, Souhail and Luqman, Muhammad Muzzamil and Coustaty, Micka{\"e}l and Ogier, Jean-Marc},
  title     = {{KhmerST}: A Low-Resource {Khmer} Scene Text Detection and Recognition Benchmark},
  booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)},
  month     = dec,
  year      = {2024},
  pages     = {1777--1792},
}
On Unsupervised Partial Shape Correspondence-
[pdf]
[supp]
[bibtex]@InProceedings{Bracha_2024_ACCV,
  author    = {Bracha, Amit and Dag{\`e}s, Thomas and Kimmel, Ron},
  title     = {On Unsupervised Partial Shape Correspondence},
  booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)},
  month     = dec,
  year      = {2024},
  pages     = {4488--4504},
}
Learning Non-Uniform Step Sizes for Neural Network Quantization-
[pdf]
[supp]
[bibtex]@InProceedings{Gongyo_2024_ACCV,
  author    = {Gongyo, Shinya and Liang, Jinrong and Ambai, Mitsuru and Kawakami, Rei and Sato, Ikuro},
  title     = {Learning Non-Uniform Step Sizes for Neural Network Quantization},
  booktitle = {Proceedings of the Asian Conference on Computer Vision (ACCV)},
  month     = dec,
  year      = {2024},
  pages     = {4385--4402},
}