CVPR 2026 Open Access Repository

Computer Vision × Education: Building a Cross‑Community Agenda for Multimodal Vision in Classrooms

Scaffolding Human Learning by Shaping Visual Environment: Yuji Zhang,

Duo Zhou,

Bo Chen,

Aditya Chalasani,

Noah Schroeder,

H Chad Lane,

ChengXiang Zhai; [pdf]
[bibtex]
@InProceedings{Zhang_2026_CVPR,
  author    = {Zhang, Yuji and Zhou, Duo and Chen, Bo and Chalasani, Aditya and Schroeder, Noah and Lane, H Chad and Zhai, ChengXiang},
  title     = {Scaffolding Human Learning by Shaping Visual Environment},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {10922--10931},
}
From Emotion Recognition to Mind-Wandering Detection: A Comparative Analysis of Video-Based Emotion Foundation Models: Ekta Sood,

Sebastian Ricke,

Trisha Mittal,

Sidney K D'Mello; [pdf]
[bibtex]
@InProceedings{Sood_2026_CVPR,
  author    = {Sood, Ekta and Ricke, Sebastian and Mittal, Trisha and D'Mello, Sidney K},
  title     = {From Emotion Recognition to Mind-Wandering Detection: A Comparative Analysis of Video-Based Emotion Foundation Models},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {10874--10882},
}
Evaluating Web-trained Facial Expression Recognition in Naturalistic Collaborative Learning: Sifatul Anindho,

Videep Venkatesha,

Nathaniel Blanchard; [pdf] [supp]
[bibtex]
@InProceedings{Anindho_2026_CVPR,
  author    = {Anindho, Sifatul and Venkatesha, Videep and Blanchard, Nathaniel},
  title     = {Evaluating Web-trained Facial Expression Recognition in Naturalistic Collaborative Learning},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {10789--10798},
}
InterventionLens: A Multi-Agent Framework for Detecting ASD Intervention Strategies in Parent-Child Shared Reading: Xiao Wang,

Lu Dong,

Ifeoma Nwogu,

Srirangaraj Setlur,

Venu Govindaraju; [pdf] [arXiv]
[bibtex]
% NOTE(review): the key Wang_2026_CVPR is also used in this listing by the entry for
% "AI-Assisted Competency Assessment from Egocentric Video in Simulation-Based Nursing Education".
% Rename one of the two before merging both into a single .bib database.
@InProceedings{Wang_2026_CVPR,
  author    = {Wang, Xiao and Dong, Lu and Nwogu, Ifeoma and Setlur, Srirangaraj and Govindaraju, Venu},
  title     = {{InterventionLens}: A Multi-Agent Framework for Detecting {ASD} Intervention Strategies in Parent-Child Shared Reading},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {10904--10911},
}
Cross-modal Affinity-aligned Multimodal Learning Analytics for Predicting Student Collaboration Satisfaction in Game-Based Learning: Wen-Hsin Tsai,

Chia-Ming Lee,

Yuk-Ying Tung; [pdf] [arXiv]
[bibtex]
@InProceedings{Tsai_2026_CVPR,
  author    = {Tsai, Wen-Hsin and Lee, Chia-Ming and Tung, Yuk-Ying},
  title     = {Cross-modal Affinity-aligned Multimodal Learning Analytics for Predicting Student Collaboration Satisfaction in Game-Based Learning},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {10893--10903},
}
Context Matters: Peer-Aware Student Behavioral Engagement Measurement via VLM Action Parsing and LLM Sequence Classification: Ahmed Abdelkawy,

Ahmed Elsayed,

Asem Ali,

Aly Farag,

Thomas Tretter,

Michael McIntyre; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Abdelkawy_2026_CVPR,
  author    = {Abdelkawy, Ahmed and Elsayed, Ahmed and Ali, Asem and Farag, Aly and Tretter, Thomas and McIntyre, Michael},
  title     = {Context Matters: Peer-Aware Student Behavioral Engagement Measurement via {VLM} Action Parsing and {LLM} Sequence Classification},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {10779--10788},
}
CSU101: An Educational Dataset for Introductory Computer Vision: Ethan Seefried,

Changsoo Jung,

Videep Venkatesha,

Trevor Chartier,

Caleb Christian,

Jack Fitzgerald,

Mariah Bradford,

Sifatul Anindho,

Matthew Sturgeon,

Nathaniel Blanchard; [pdf]
[bibtex]
@InProceedings{Seefried_2026_CVPR,
  author    = {Seefried, Ethan and Jung, Changsoo and Venkatesha, Videep and Chartier, Trevor and Christian, Caleb and Fitzgerald, Jack and Bradford, Mariah and Anindho, Sifatul and Sturgeon, Matthew and Blanchard, Nathaniel},
  title     = {{CSU101}: An Educational Dataset for Introductory Computer Vision},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {10864--10873},
}
Speech-Synchronized Whiteboard Generation via VLM-Driven Structured Drawing Representations: Suraj Prasad,

Pinak Mahapatra; [pdf] [arXiv]
[bibtex]
@InProceedings{Prasad_2026_CVPR,
  author    = {Prasad, Suraj and Mahapatra, Pinak},
  title     = {Speech-Synchronized Whiteboard Generation via {VLM}-Driven Structured Drawing Representations},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {10859--10863},
}
VLMath: A Multimodal Vision-Language System for Pedagogically Aligned Math Tutoring: Mahsa Ardakani,

Arshia Eslami,

Ramtin Zand; [pdf] [supp]
[bibtex]
@InProceedings{Ardakani_2026_CVPR,
  author    = {Ardakani, Mahsa and Eslami, Arshia and Zand, Ramtin},
  title     = {{VLMath}: A Multimodal Vision-Language System for Pedagogically Aligned Math Tutoring},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {10799--10809},
}
AI-Assisted Competency Assessment from Egocentric Video in Simulation-Based Nursing Education: Hanchen David Wang,

Yilin Liu,

Madison J. Mason,

Surya Chand Rayala,

Gautam Biswas,

Daniel T. Levin,

Meiyi Ma; [pdf] [supp]
[bibtex]
% NOTE(review): the key Wang_2026_CVPR is also used in this listing by the entry for
% "InterventionLens: A Multi-Agent Framework for Detecting ASD Intervention Strategies in Parent-Child Shared Reading".
% Rename one of the two before merging both into a single .bib database.
@InProceedings{Wang_2026_CVPR,
  author    = {Wang, Hanchen David and Liu, Yilin and Mason, Madison J. and Rayala, Surya Chand and Biswas, Gautam and Levin, Daniel T. and Ma, Meiyi},
  title     = {{AI}-Assisted Competency Assessment from Egocentric Video in Simulation-Based Nursing Education},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {10912--10921},
}
MES-Bench: A Benchmark for Multimodal Elaborative Simplification and Comprehensibility Evaluation in Language Learning: Martyna Gruszka,

Risa Shinoda,

Taiki Miyanishi,

Takumi Hirose,

Nakamasa Inoue; [pdf]
[bibtex]
@InProceedings{Gruszka_2026_CVPR,
  author    = {Gruszka, Martyna and Shinoda, Risa and Miyanishi, Taiki and Hirose, Takumi and Inoue, Nakamasa},
  title     = {{MES-Bench}: A Benchmark for Multimodal Elaborative Simplification and Comprehensibility Evaluation in Language Learning},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {10820--10829},
}
ReSoFed: Reliability-Guided Model Souping for Robust Federated Learning in Heterogeneous Classroom Environments: Muhammad Rafsan Kabir,

Md Shopon,

Marina L. Gavrilova; [pdf]
[bibtex]
@InProceedings{Kabir_2026_CVPR,
  author    = {Kabir, Muhammad Rafsan and Shopon, Md and Gavrilova, Marina L.},
  title     = {{ReSoFed}: Reliability-Guided Model Souping for Robust Federated Learning in Heterogeneous Classroom Environments},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {10839--10848},
}
Delta-Gated Incremental Multi-Forward-Pass Modeling for Robust Multimodal Classroom Video Understanding: Chongyu He,

Peter Youngs,

Scott Acton; [pdf]
[bibtex]
@InProceedings{He_2026_CVPR,
  author    = {He, Chongyu and Youngs, Peter and Acton, Scott},
  title     = {Delta-Gated Incremental Multi-Forward-Pass Modeling for Robust Multimodal Classroom Video Understanding},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {10830--10838},
}
Sequence-Based Identification of First-Person Camera Wearers in Third-Person Views: Ziwei Zhao,

Xizi Wang,

Yuchen Wang,

Feng Cheng,

David Crandall; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhao_2026_CVPR,
  author    = {Zhao, Ziwei and Wang, Xizi and Wang, Yuchen and Cheng, Feng and Crandall, David},
  title     = {Sequence-Based Identification of First-Person Camera Wearers in Third-Person Views},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {10932--10943},
}
Do Emotion Recognition Models Generalize to Classrooms? Robustness and Fairness Analysis: Ashwin T S,

Srigowri Mayasandra Prasanna,

Joyce Horn Fonteles,

Gautam Biswas; [pdf]
[bibtex]
% NOTE(review): the first author is exported as surname "S" with given names "Ashwin T";
% confirm the intended name split against the paper before relying on sorted or abbreviated output.
@InProceedings{S_2026_CVPR,
  author    = {S, Ashwin T and Prasanna, Srigowri Mayasandra and Fonteles, Joyce Horn and Biswas, Gautam},
  title     = {Do Emotion Recognition Models Generalize to Classrooms? Robustness and Fairness Analysis},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {10883--10892},
}
ConfusionBench: An Expert-Validated Benchmark for Confusion Recognition and Localization in Educational Videos: Lu Dong,

Xiao Wang,

Mark Frank,

Srirangaraj Setlur,

Venu Govindaraju,

Ifeoma Nwogu; [pdf] [arXiv]
[bibtex]
@InProceedings{Dong_2026_CVPR,
  author    = {Dong, Lu and Wang, Xiao and Frank, Mark and Setlur, Srirangaraj and Govindaraju, Venu and Nwogu, Ifeoma},
  title     = {{ConfusionBench}: An Expert-Validated Benchmark for Confusion Recognition and Localization in Educational Videos},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {10810--10819},
}
Diagnosis of Human-Object Interaction Detectors for Real-World Educational Applications: Divya Mereddy,

Ashwin Tudur Sadashiva,

Marcos Quinones-Grueiro,

Gautam Biswas; [pdf] [supp]
[bibtex]
@InProceedings{Mereddy_2026_CVPR,
  author    = {Mereddy, Divya and Sadashiva, Ashwin Tudur and Quinones-Grueiro, Marcos and Biswas, Gautam},
  title     = {Diagnosis of Human-Object Interaction Detectors for Real-World Educational Applications},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {10849--10858},
}