8th AI City Challenge


An Online Approach and Evaluation Method for Tracking People Across Cameras in Extremely Long Video Sequence
Cheng-Yen Yang,
Hsiang-Wei Huang,
Pyong-Kun Kim,
Zhongyu Jiang,
Kwang-Ju Kim,
Chung-I Huang,
Haiqing Du,
Jenq-Neng Hwang
[pdf]
[bibtex]
@InProceedings{Yang_2024_CVPR,
  author    = {Yang, Cheng-Yen and Huang, Hsiang-Wei and Kim, Pyong-Kun and Jiang, Zhongyu and Kim, Kwang-Ju and Huang, Chung-I and Du, Haiqing and Hwang, Jenq-Neng},
  title     = {An Online Approach and Evaluation Method for Tracking People Across Cameras in Extremely Long Video Sequence},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {7037--7045}
}

OCMCTrack: Online Multi-Target Multi-Camera Tracking with Corrective Matching Cascade
Andreas Specker
[pdf]
[bibtex]
@InProceedings{Specker_2024_CVPR,
  author    = {Specker, Andreas},
  title     = {{OCMCTrack}: Online Multi-Target Multi-Camera Tracking with Corrective Matching Cascade},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {7236--7244}
}

An Effective Method for Detecting Violation of Helmet Rule for Motorcyclists
Yunliang Chen,
Wei Zhou,
Zicen Zhou,
Bing Ma,
Chen Wang,
Yingda Shang,
An Guo,
Tianshu Chu
[pdf]
[bibtex]
@InProceedings{Chen_2024_CVPR,
  author    = {Chen, Yunliang and Zhou, Wei and Zhou, Zicen and Ma, Bing and Wang, Chen and Shang, Yingda and Guo, An and Chu, Tianshu},
  title     = {An Effective Method for Detecting Violation of Helmet Rule for Motorcyclists},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {7085--7090}
}

Simple In-place Data Augmentation for Surveillance Object Detection
Munkh-Erdene Otgonbold,
Ganzorig Batnasan,
Munkhjargal Gochoo
[pdf] [arXiv]
[bibtex]
@InProceedings{Otgonbold_2024_CVPR,
  author    = {Otgonbold, Munkh-Erdene and Batnasan, Ganzorig and Gochoo, Munkhjargal},
  title     = {Simple In-place Data Augmentation for Surveillance Object Detection},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {7208--7216}
}

Robust Data Augmentation and Ensemble Method for Object Detection in Fisheye Camera Images
Viet Hung Duong,
Duc Quyen Nguyen,
Thien Van Luong,
Huan Vu,
Tien Cuong Nguyen
[pdf]
[bibtex]
@InProceedings{Duong_2024_CVPR,
  author    = {Duong, Viet Hung and Nguyen, Duc Quyen and Van Luong, Thien and Vu, Huan and Nguyen, Tien Cuong},
  title     = {Robust Data Augmentation and Ensemble Method for Object Detection in Fisheye Camera Images},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {7017--7026}
}

FE-Det: An Effective Traffic Object Detection Framework for Fish-Eye Cameras
Xingshuang Luo,
Zhe Cui,
Fei Su
[pdf]
[bibtex]
@InProceedings{Luo_2024_CVPR,
  author    = {Luo, Xingshuang and Cui, Zhe and Su, Fei},
  title     = {{FE-Det}: An Effective Traffic Object Detection Framework for Fish-Eye Cameras},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {7091--7099}
}

DeepLocalization: Using Change Point Detection for Temporal Action Localization
Mohammed Shaiqur Rahman,
Ibne Farabi Shihab,
Lynna Chu,
Anuj Sharma
[pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Rahman_2024_CVPR,
  author    = {Rahman, Mohammed Shaiqur and Shihab, Ibne Farabi and Chu, Lynna and Sharma, Anuj},
  title     = {{DeepLocalization}: Using Change Point Detection for Temporal Action Localization},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {7252--7260}
}

Online Multi-camera People Tracking with Spatial-temporal Mechanism and Anchor-feature Hierarchical Clustering
Riu Cherdchusakulchai,
Sasin Phimsiri,
Visarut Trairattanapa,
Suchat Tungjitnob,
Wasu Kudisthalert,
Pornprom Kiawjak,
Ek Thamwiwatthana,
Phawat Borisuitsawat,
Teepakorn Tosawadi,
Pakcheera Choppradit,
Kasisdis Mahakijdechachai,
Supawit Vatathanavaro,
Worawit Saetan,
Vasin Suttichaya
[pdf]
[bibtex]
@InProceedings{Cherdchusakulchai_2024_CVPR,
  author    = {Cherdchusakulchai, Riu and Phimsiri, Sasin and Trairattanapa, Visarut and Tungjitnob, Suchat and Kudisthalert, Wasu and Kiawjak, Pornprom and Thamwiwatthana, Ek and Borisuitsawat, Phawat and Tosawadi, Teepakorn and Choppradit, Pakcheera and Mahakijdechachai, Kasisdis and Vatathanavaro, Supawit and Saetan, Worawit and Suttichaya, Vasin},
  title     = {Online Multi-camera People Tracking with Spatial-temporal Mechanism and Anchor-feature Hierarchical Clustering},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {7198--7207}
}

Cluster Self-Refinement for Enhanced Online Multi-Camera People Tracking
Jeongho Kim,
Wooksu Shin,
Hancheol Park,
Donghyuk Choi
[pdf]
[bibtex]
@InProceedings{Kim_2024_CVPR,
  author    = {Kim, Jeongho and Shin, Wooksu and Park, Hancheol and Choi, Donghyuk},
  title     = {Cluster Self-Refinement for Enhanced Online Multi-Camera People Tracking},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {7190--7197}
}

Improving Object Detection to Fisheye Cameras with Open-Vocabulary Pseudo-Label Approach
Long Hoang Pham,
Quoc Pham-Nam Ho,
Duong Nguyen-Ngoc Tran,
Tai Huu-Phuong Tran,
Huy-Hung Nguyen,
Duong Khac Vu,
Chi Dai Tran,
Ngoc Doan-Minh Huynh,
Hyung-Min Jeon,
Hyung-Joon Jeon,
Jae Wook Jeon
[pdf]
[bibtex]
@InProceedings{Pham_2024_CVPR,
  author    = {Pham, Long Hoang and Ho, Quoc Pham-Nam and Tran, Duong Nguyen-Ngoc and Tran, Tai Huu-Phuong and Nguyen, Huy-Hung and Vu, Duong Khac and Tran, Chi Dai and Huynh, Ngoc Doan-Minh and Jeon, Hyung-Min and Jeon, Hyung-Joon and Jeon, Jae Wook},
  title     = {Improving Object Detection to Fisheye Cameras with Open-Vocabulary Pseudo-Label Approach},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {7100--7107}
}

Multi-View Spatial-Temporal Learning for Understanding Unusual Behaviors in Untrimmed Naturalistic Driving Videos
Huy-Hung Nguyen,
Chi Dai Tran,
Long Hoang Pham,
Duong Nguyen-Ngoc Tran,
Tai Huu-Phuong Tran,
Duong Khac Vu,
Quoc Pham-Nam Ho,
Ngoc Doan-Minh Huynh,
Hyung-Min Jeon,
Hyung-Joon Jeon,
Jae Wook Jeon
[pdf]
[bibtex]
@InProceedings{Nguyen_2024_CVPR,
  author    = {Nguyen, Huy-Hung and Tran, Chi Dai and Pham, Long Hoang and Tran, Duong Nguyen-Ngoc and Tran, Tai Huu-Phuong and Vu, Duong Khac and Ho, Quoc Pham-Nam and Huynh, Ngoc Doan-Minh and Jeon, Hyung-Min and Jeon, Hyung-Joon and Jeon, Jae Wook},
  title     = {Multi-View Spatial-Temporal Learning for Understanding Unusual Behaviors in Untrimmed Naturalistic Driving Videos},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {7144--7152}
}

Low-Light Image Enhancement Framework for Improved Object Detection in Fisheye Lens Datasets
Dai Quoc Tran,
Armstrong Aboah,
Yuntae Jeon,
Maged Shoman,
Minsoo Park,
Seunghee Park
[pdf] [arXiv]
[bibtex]
@InProceedings{Tran_2024_CVPR,
  author    = {Tran, Dai Quoc and Aboah, Armstrong and Jeon, Yuntae and Shoman, Maged and Park, Minsoo and Park, Seunghee},
  title     = {Low-Light Image Enhancement Framework for Improved Object Detection in Fisheye Lens Datasets},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {7056--7065}
}

TrafficVLM: A Controllable Visual Language Model for Traffic Video Captioning
Quang Minh Dinh,
Minh Khoi Ho,
Anh Quan Dang,
Hung Phong Tran
[pdf] [arXiv]
[bibtex]
@InProceedings{Dinh_2024_CVPR,
  author    = {Dinh, Quang Minh and Ho, Minh Khoi and Dang, Anh Quan and Tran, Hung Phong},
  title     = {{TrafficVLM}: A Controllable Visual Language Model for Traffic Video Captioning},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {7134--7143}
}

Road Object Detection Robust to Distorted Objects at the Edge Regions of Images
Wooksu Shin,
Donghyuk Choi,
Hancheol Park,
Jeongho Kim
[pdf]
[bibtex]
@InProceedings{Shin_2024_CVPR,
  author    = {Shin, Wooksu and Choi, Donghyuk and Park, Hancheol and Kim, Jeongho},
  title     = {Road Object Detection Robust to Distorted Objects at the Edge Regions of Images},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {7245--7251}
}

Divide and Conquer Boosting for Enhanced Traffic Safety Description and Analysis with Large Vision Language Model
Khai Trinh Xuan,
Khoi Nguyen Nguyen,
Bach Hoang Ngo,
Vu Dinh Xuan,
Minh-Hung An,
Quang-Vinh Dinh
[pdf]
[bibtex]
@InProceedings{Xuan_2024_CVPR,
  author    = {Xuan, Khai Trinh and Nguyen, Khoi Nguyen and Ngo, Bach Hoang and Xuan, Vu Dinh and An, Minh-Hung and Dinh, Quang-Vinh},
  title     = {Divide and Conquer Boosting for Enhanced Traffic Safety Description and Analysis with Large Vision Language Model},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {7046--7055}
}

Motorcyclist Helmet Violation Detection Framework by Leveraging Robust Ensemble and Augmentation Methods
Thien Van Luong,
Huu Si Phuc Nguyen,
Duy Khanh Dinh,
Viet Hung Duong,
Duy Hong Sam Vo,
Huan Vu,
Minh Tuan Hoang,
Tien Cuong Nguyen
[pdf]
[bibtex]
@InProceedings{Van_Luong_2024_CVPR,
  author    = {Van Luong, Thien and Nguyen, Huu Si Phuc and Dinh, Duy Khanh and Duong, Viet Hung and Vo, Duy Hong Sam and Vu, Huan and Hoang, Minh Tuan and Nguyen, Tien Cuong},
  title     = {Motorcyclist Helmet Violation Detection Framework by Leveraging Robust Ensemble and Augmentation Methods},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {7027--7036}
}

Augmented Self-Mask Attention Transformer for Naturalistic Driving Action Recognition
Tiantian Zhang,
Qingtian Wang,
Xiaodong Dong,
Wenqing Yu,
Hao Sun,
Xuyang Zhou,
Aigong Zhen,
Shun Cui,
Dong Wu,
Zhongjiang He
[pdf]
[bibtex]
@InProceedings{Zhang_2024_CVPR,
  author    = {Zhang, Tiantian and Wang, Qingtian and Dong, Xiaodong and Yu, Wenqing and Sun, Hao and Zhou, Xuyang and Zhen, Aigong and Cui, Shun and Wu, Dong and He, Zhongjiang},
  title     = {Augmented Self-Mask Attention Transformer for Naturalistic Driving Action Recognition},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {7108--7114}
}

Efficient Online Multi-Camera Tracking with Memory-Efficient Accumulated Appearance Features and Trajectory Validation
Lap Quoc Tran,
Huan Duc Vi
[pdf]
[bibtex]
% Key carries a "_b" suffix because this file already defines Tran_2024_CVPR
% (Tran, Dai Quoc et al.); BibTeX rejects a repeated key and keeps only the first.
@InProceedings{Tran_2024_CVPR_b,
  author    = {Tran, Lap Quoc and Vi, Huan Duc},
  title     = {Efficient Online Multi-Camera Tracking with Memory-Efficient Accumulated Appearance Features and Trajectory Validation},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {7217--7226}
}

Enhancing Traffic Safety with Parallel Dense Video Captioning for End-to-End Event Analysis
Maged Shoman,
Dongdong Wang,
Armstrong Aboah,
Mohamed Abdel-Aty
[pdf] [arXiv]
[bibtex]
@InProceedings{Shoman_2024_CVPR,
  author    = {Shoman, Maged and Wang, Dongdong and Aboah, Armstrong and Abdel-Aty, Mohamed},
  title     = {Enhancing Traffic Safety with Parallel Dense Video Captioning for End-to-End Event Analysis},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {7125--7133}
}

Robust Motorcycle Helmet Detection in Real-World Scenarios: Using Co-DETR and Minority Class Enhancement
Hao Vo,
Sieu Tran,
Duc Minh Nguyen,
Thua Nguyen,
Tien Do,
Duy-Dinh Le,
Thanh Duc Ngo
[pdf]
[bibtex]
@InProceedings{Vo_2024_CVPR,
  author    = {Vo, Hao and Tran, Sieu and Nguyen, Duc Minh and Nguyen, Thua and Do, Tien and Le, Duy-Dinh and Ngo, Thanh Duc},
  title     = {Robust Motorcycle Helmet Detection in Real-World Scenarios: Using {Co-DETR} and Minority Class Enhancement},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {7163--7171}
}

A Coarse-to-fine Two-stage Helmet Detection Method for Motorcyclists
Hongpu Zhang,
Zhe Cui,
Fei Su
[pdf]
[bibtex]
% Key carries a "_b" suffix because this file already defines Zhang_2024_CVPR
% (Zhang, Tiantian et al.); BibTeX rejects a repeated key and keeps only the first.
@InProceedings{Zhang_2024_CVPR_b,
  author    = {Zhang, Hongpu and Cui, Zhe and Su, Fei},
  title     = {A Coarse-to-fine Two-stage Helmet Detection Method for Motorcyclists},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {7066--7074}
}

Overlap Suppression Clustering for Offline Multi-Camera People Tracking
Ryuto Yoshida,
Junichi Okubo,
Junichiro Fujii,
Masazumi Amakata,
Takayoshi Yamashita
[pdf]
[bibtex]
@InProceedings{Yoshida_2024_CVPR,
  author    = {Yoshida, Ryuto and Okubo, Junichi and Fujii, Junichiro and Amakata, Masazumi and Yamashita, Takayoshi},
  title     = {Overlap Suppression Clustering for Offline Multi-Camera People Tracking},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {7153--7162}
}

The 8th AI City Challenge
Shuo Wang,
David C. Anastasiu,
Zheng Tang,
Ming-Ching Chang,
Yue Yao,
Liang Zheng,
Mohammed Shaiqur Rahman,
Meenakshi S. Arya,
Anuj Sharma,
Pranamesh Chakraborty,
Sanjita Prajapati,
Quan Kong,
Norimasa Kobori,
Munkhjargal Gochoo,
Munkh-Erdene Otgonbold,
Fady Alnajjar,
Ganzorig Batnasan,
Ping-Yang Chen,
Jun-Wei Hsieh,
Xunlei Wu,
Sameer Satish Pusegaonkar,
Yizhou Wang,
Sujit Biswas,
Rama Chellappa
[pdf] [arXiv]
[bibtex]
@InProceedings{Wang_2024_CVPR,
  author    = {Wang, Shuo and Anastasiu, David C. and Tang, Zheng and Chang, Ming-Ching and Yao, Yue and Zheng, Liang and Rahman, Mohammed Shaiqur and Arya, Meenakshi S. and Sharma, Anuj and Chakraborty, Pranamesh and Prajapati, Sanjita and Kong, Quan and Kobori, Norimasa and Gochoo, Munkhjargal and Otgonbold, Munkh-Erdene and Alnajjar, Fady and Batnasan, Ganzorig and Chen, Ping-Yang and Hsieh, Jun-Wei and Wu, Xunlei and Pusegaonkar, Sameer Satish and Wang, Yizhou and Biswas, Sujit and Chellappa, Rama},
  title     = {The 8th {AI City Challenge}},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {7261--7272}
}

Enhancing Road Object Detection in Fisheye Cameras: An Effective Framework Integrating SAHI and Hybrid Inference
Bao Tran Gia,
Tuong Bui Cong Khanh,
Hien Ho Trong,
Thuyen Tran Doan,
Tien Do,
Duy-Dinh Le,
Thanh Duc Ngo
[pdf]
[bibtex]
@InProceedings{Gia_2024_CVPR,
  author    = {Gia, Bao Tran and Khanh, Tuong Bui Cong and Trong, Hien Ho and Doan, Thuyen Tran and Do, Tien and Le, Duy-Dinh and Ngo, Thanh Duc},
  title     = {Enhancing Road Object Detection in Fisheye Cameras: An Effective Framework Integrating {SAHI} and Hybrid Inference},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {7227--7235}
}

A Robust Online Multi-Camera People Tracking System With Geometric Consistency and State-aware Re-ID Correction
Zhenyu Xie,
Zelin Ni,
Wenjie Yang,
Yuang Zhang,
Yihang Chen,
Yang Zhang,
Xiao Ma
[pdf]
[bibtex]
@InProceedings{Xie_2024_CVPR,
  author    = {Xie, Zhenyu and Ni, Zelin and Yang, Wenjie and Zhang, Yuang and Chen, Yihang and Zhang, Yang and Ma, Xiao},
  title     = {A Robust Online Multi-Camera People Tracking System With Geometric Consistency and State-aware {Re-ID} Correction},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {7007--7016}
}

KI-GAN: Knowledge-Informed Generative Adversarial Networks for Enhanced Multi-Vehicle Trajectory Forecasting at Signalized Intersections
Chuheng Wei,
Guoyuan Wu,
Matthew J. Barth,
Amr Abdelraouf,
Rohit Gupta,
Kyungtae Han
[pdf]
[bibtex]
@InProceedings{Wei_2024_CVPR,
  author    = {Wei, Chuheng and Wu, Guoyuan and Barth, Matthew J. and Abdelraouf, Amr and Gupta, Rohit and Han, Kyungtae},
  title     = {{KI-GAN}: Knowledge-Informed Generative Adversarial Networks for Enhanced Multi-Vehicle Trajectory Forecasting at Signalized Intersections},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {7115--7124}
}

Multi-View Action Recognition for Distracted Driver Behavior Localization
Yuehuan Xu,
Shuai Jiang,
Zhe Cui,
Fei Su
[pdf]
[bibtex]
@InProceedings{Xu_2024_CVPR,
  author    = {Xu, Yuehuan and Jiang, Shuai and Cui, Zhe and Su, Fei},
  title     = {Multi-View Action Recognition for Distracted Driver Behavior Localization},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {7172--7179}
}

Multi-perspective Traffic Video Description Model with Fine-grained Refinement Approach
Tuan-An To,
Minh-Nam Tran,
Trong-Bao Ho,
Thien-Loc Ha,
Quang-Tan Nguyen,
Hoang-Chau Luong,
Thanh-Duy Cao,
Minh-Triet Tran
[pdf]
[bibtex]
@InProceedings{To_2024_CVPR,
  author    = {To, Tuan-An and Tran, Minh-Nam and Ho, Trong-Bao and Ha, Thien-Loc and Nguyen, Quang-Tan and Luong, Hoang-Chau and Cao, Thanh-Duy and Tran, Minh-Triet},
  title     = {Multi-perspective Traffic Video Description Model with Fine-grained Refinement Approach},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {7075--7084}
}

CityLLaVA: Efficient Fine-Tuning for VLMs in City Scenario
Zhizhao Duan,
Hao Cheng,
Duo Xu,
Xi Wu,
Xiangxie Zhang,
Xi Ye,
Zhen Xie
[pdf] [arXiv]
[bibtex]
@InProceedings{Duan_2024_CVPR,
  author    = {Duan, Zhizhao and Cheng, Hao and Xu, Duo and Wu, Xi and Zhang, Xiangxie and Ye, Xi and Xie, Zhen},
  title     = {{CityLLaVA}: Efficient Fine-Tuning for {VLMs} in City Scenario},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {7180--7189}
}