Computer Vision × Education: Building a Cross‑Community Agenda for Multimodal Vision in Classrooms


Scaffolding Human Learning by Shaping Visual Environment
Yuji Zhang,
Duo Zhou,
Bo Chen,
Aditya Chalasani,
Noah Schroeder,
H Chad Lane,
ChengXiang Zhai
[pdf]
[bibtex]
@InProceedings{Zhang_2026_CVPR,
    author    = {Zhang, Yuji and Zhou, Duo and Chen, Bo and Chalasani, Aditya and Schroeder, Noah and Lane, H Chad and Zhai, ChengXiang},
    title     = {Scaffolding Human Learning by Shaping Visual Environment},
    booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
    month     = jun,
    year      = {2026},
    pages     = {10922--10931},
}

From Emotion Recognition to Mind-Wandering Detection: A Comparative Analysis of Video-Based Emotion Foundation Models
Ekta Sood,
Sebastian Ricke,
Trisha Mittal,
Sidney K D'Mello
[pdf]
[bibtex]
@InProceedings{Sood_2026_CVPR,
    author    = {Sood, Ekta and Ricke, Sebastian and Mittal, Trisha and D'Mello, Sidney K},
    title     = {From Emotion Recognition to Mind-Wandering Detection: A Comparative Analysis of Video-Based Emotion Foundation Models},
    booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
    month     = jun,
    year      = {2026},
    pages     = {10874--10882},
}

Evaluating Web-trained Facial Expression Recognition in Naturalistic Collaborative Learning
Sifatul Anindho,
Videep Venkatesha,
Nathaniel Blanchard
[pdf] [supp]
[bibtex]
@InProceedings{Anindho_2026_CVPR,
    author    = {Anindho, Sifatul and Venkatesha, Videep and Blanchard, Nathaniel},
    title     = {Evaluating Web-trained Facial Expression Recognition in Naturalistic Collaborative Learning},
    booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
    month     = jun,
    year      = {2026},
    pages     = {10789--10798},
}

InterventionLens: A Multi-Agent Framework for Detecting ASD Intervention Strategies in Parent-Child Shared Reading
Xiao Wang,
Lu Dong,
Ifeoma Nwogu,
Srirangaraj Setlur,
Venu Govindaraju
[pdf] [arXiv]
[bibtex]
@comment{NOTE(review): the key Wang_2026_CVPR is also used by the entry for "AI-Assisted Competency Assessment from Egocentric Video in Simulation-Based Nursing Education" in this listing; rename one of them if both are imported into the same .bib file.}
@InProceedings{Wang_2026_CVPR,
    author    = {Wang, Xiao and Dong, Lu and Nwogu, Ifeoma and Setlur, Srirangaraj and Govindaraju, Venu},
    title     = {{InterventionLens}: A Multi-Agent Framework for Detecting {ASD} Intervention Strategies in Parent-Child Shared Reading},
    booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
    month     = jun,
    year      = {2026},
    pages     = {10904--10911},
}

Cross-modal Affinity-aligned Multimodal Learning Analytics for Predicting Student Collaboration Satisfaction in Game-Based Learning
Wen-Hsin Tsai,
Chia-Ming Lee,
Yuk-Ying Tung
[pdf] [arXiv]
[bibtex]
@InProceedings{Tsai_2026_CVPR,
    author    = {Tsai, Wen-Hsin and Lee, Chia-Ming and Tung, Yuk-Ying},
    title     = {Cross-modal Affinity-aligned Multimodal Learning Analytics for Predicting Student Collaboration Satisfaction in Game-Based Learning},
    booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
    month     = jun,
    year      = {2026},
    pages     = {10893--10903},
}

Context Matters: Peer-Aware Student Behavioral Engagement Measurement via VLM Action Parsing and LLM Sequence Classification
Ahmed Abdelkawy,
Ahmed Elsayed,
Asem Ali,
Aly Farag,
Thomas Tretter,
Michael McIntyre
[pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Abdelkawy_2026_CVPR,
    author    = {Abdelkawy, Ahmed and Elsayed, Ahmed and Ali, Asem and Farag, Aly and Tretter, Thomas and McIntyre, Michael},
    title     = {Context Matters: Peer-Aware Student Behavioral Engagement Measurement via {VLM} Action Parsing and {LLM} Sequence Classification},
    booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
    month     = jun,
    year      = {2026},
    pages     = {10779--10788},
}

CSU101: An Educational Dataset for Introductory Computer Vision
Ethan Seefried,
Changsoo Jung,
Videep Venkatesha,
Trevor Chartier,
Caleb Christian,
Jack Fitzgerald,
Mariah Bradford,
Sifatul Anindho,
Matthew Sturgeon,
Nathaniel Blanchard
[pdf]
[bibtex]
@InProceedings{Seefried_2026_CVPR,
    author    = {Seefried, Ethan and Jung, Changsoo and Venkatesha, Videep and Chartier, Trevor and Christian, Caleb and Fitzgerald, Jack and Bradford, Mariah and Anindho, Sifatul and Sturgeon, Matthew and Blanchard, Nathaniel},
    title     = {{CSU101}: An Educational Dataset for Introductory Computer Vision},
    booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
    month     = jun,
    year      = {2026},
    pages     = {10864--10873},
}

Speech-Synchronized Whiteboard Generation via VLM-Driven Structured Drawing Representations
Suraj Prasad,
Pinak Mahapatra
[pdf] [arXiv]
[bibtex]
@InProceedings{Prasad_2026_CVPR,
    author    = {Prasad, Suraj and Mahapatra, Pinak},
    title     = {Speech-Synchronized Whiteboard Generation via {VLM}-Driven Structured Drawing Representations},
    booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
    month     = jun,
    year      = {2026},
    pages     = {10859--10863},
}

VLMath: A Multimodal Vision-Language System for Pedagogically Aligned Math Tutoring
Mahsa Ardakani,
Arshia Eslami,
Ramtin Zand
[pdf] [supp]
[bibtex]
@InProceedings{Ardakani_2026_CVPR,
    author    = {Ardakani, Mahsa and Eslami, Arshia and Zand, Ramtin},
    title     = {{VLMath}: A Multimodal Vision-Language System for Pedagogically Aligned Math Tutoring},
    booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
    month     = jun,
    year      = {2026},
    pages     = {10799--10809},
}

AI-Assisted Competency Assessment from Egocentric Video in Simulation-Based Nursing Education
Hanchen David Wang,
Yilin Liu,
Madison J. Mason,
Surya Chand Rayala,
Gautam Biswas,
Daniel T. Levin,
Meiyi Ma
[pdf] [supp]
[bibtex]
@comment{NOTE(review): the key Wang_2026_CVPR is also used by the entry for "InterventionLens: A Multi-Agent Framework for Detecting ASD Intervention Strategies in Parent-Child Shared Reading" in this listing; rename one of them if both are imported into the same .bib file.}
@InProceedings{Wang_2026_CVPR,
    author    = {Wang, Hanchen David and Liu, Yilin and Mason, Madison J. and Rayala, Surya Chand and Biswas, Gautam and Levin, Daniel T. and Ma, Meiyi},
    title     = {{AI}-Assisted Competency Assessment from Egocentric Video in Simulation-Based Nursing Education},
    booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
    month     = jun,
    year      = {2026},
    pages     = {10912--10921},
}

MES-Bench: A Benchmark for Multimodal Elaborative Simplification and Comprehensibility Evaluation in Language Learning
Martyna Gruszka,
Risa Shinoda,
Taiki Miyanishi,
Takumi Hirose,
Nakamasa Inoue
[pdf]
[bibtex]
@InProceedings{Gruszka_2026_CVPR,
    author    = {Gruszka, Martyna and Shinoda, Risa and Miyanishi, Taiki and Hirose, Takumi and Inoue, Nakamasa},
    title     = {{MES-Bench}: A Benchmark for Multimodal Elaborative Simplification and Comprehensibility Evaluation in Language Learning},
    booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
    month     = jun,
    year      = {2026},
    pages     = {10820--10829},
}

ReSoFed: Reliability-Guided Model Souping for Robust Federated Learning in Heterogeneous Classroom Environments
Muhammad Rafsan Kabir,
Md Shopon,
Marina L. Gavrilova
[pdf]
[bibtex]
@InProceedings{Kabir_2026_CVPR,
    author    = {Kabir, Muhammad Rafsan and Shopon, Md and Gavrilova, Marina L.},
    title     = {{ReSoFed}: Reliability-Guided Model Souping for Robust Federated Learning in Heterogeneous Classroom Environments},
    booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
    month     = jun,
    year      = {2026},
    pages     = {10839--10848},
}

Delta-Gated Incremental Multi-Forward-Pass Modeling for Robust Multimodal Classroom Video Understanding
Chongyu He,
Peter Youngs,
Scott Acton
[pdf]
[bibtex]
@InProceedings{He_2026_CVPR,
    author    = {He, Chongyu and Youngs, Peter and Acton, Scott},
    title     = {Delta-Gated Incremental Multi-Forward-Pass Modeling for Robust Multimodal Classroom Video Understanding},
    booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
    month     = jun,
    year      = {2026},
    pages     = {10830--10838},
}

Sequence-Based Identification of First-Person Camera Wearers in Third-Person Views
Ziwei Zhao,
Xizi Wang,
Yuchen Wang,
Feng Cheng,
David Crandall
[pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Zhao_2026_CVPR,
    author    = {Zhao, Ziwei and Wang, Xizi and Wang, Yuchen and Cheng, Feng and Crandall, David},
    title     = {Sequence-Based Identification of First-Person Camera Wearers in Third-Person Views},
    booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
    month     = jun,
    year      = {2026},
    pages     = {10932--10943},
}

Do Emotion Recognition Models Generalize to Classrooms? Robustness and Fairness Analysis
Ashwin T S,
Srigowri Mayasandra Prasanna,
Joyce Horn Fonteles,
Gautam Biswas
[pdf]
[bibtex]
@InProceedings{S_2026_CVPR,
    author    = {S, Ashwin T and Prasanna, Srigowri Mayasandra and Fonteles, Joyce Horn and Biswas, Gautam},
    title     = {Do Emotion Recognition Models Generalize to Classrooms? Robustness and Fairness Analysis},
    booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
    month     = jun,
    year      = {2026},
    pages     = {10883--10892},
}

ConfusionBench: An Expert-Validated Benchmark for Confusion Recognition and Localization in Educational Videos
Lu Dong,
Xiao Wang,
Mark Frank,
Srirangaraj Setlur,
Venu Govindaraju,
Ifeoma Nwogu
[pdf] [arXiv]
[bibtex]
@InProceedings{Dong_2026_CVPR,
    author    = {Dong, Lu and Wang, Xiao and Frank, Mark and Setlur, Srirangaraj and Govindaraju, Venu and Nwogu, Ifeoma},
    title     = {{ConfusionBench}: An Expert-Validated Benchmark for Confusion Recognition and Localization in Educational Videos},
    booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
    month     = jun,
    year      = {2026},
    pages     = {10810--10819},
}

Diagnosis of Human-Object Interaction Detectors for Real-World Educational Applications
Divya Mereddy,
Ashwin Tudur Sadashiva,
Marcos Quinones-Grueiro,
Gautam Biswas
[pdf] [supp]
[bibtex]
@InProceedings{Mereddy_2026_CVPR,
    author    = {Mereddy, Divya and Sadashiva, Ashwin Tudur and Quinones-Grueiro, Marcos and Biswas, Gautam},
    title     = {Diagnosis of Human-Object Interaction Detectors for Real-World Educational Applications},
    booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
    month     = jun,
    year      = {2026},
    pages     = {10849--10858},
}