Computer Vision × Education: Building a Cross‑Community Agenda for Multimodal Vision in Classrooms
Scaffolding Human Learning by Shaping Visual Environment
[pdf]
[bibtex]@InProceedings{Zhang_2026_CVPR,
  author    = {Zhang, Yuji and Zhou, Duo and Chen, Bo and Chalasani, Aditya and Schroeder, Noah and Lane, H. Chad and Zhai, ChengXiang},
  title     = {Scaffolding Human Learning by Shaping Visual Environment},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {10922--10931},
}
From Emotion Recognition to Mind-Wandering Detection: A Comparative Analysis of Video-Based Emotion Foundation Models
[pdf]
[bibtex]@InProceedings{Sood_2026_CVPR,
  author    = {Sood, Ekta and Ricke, Sebastian and Mittal, Trisha and D'Mello, Sidney K.},
  title     = {From Emotion Recognition to Mind-Wandering Detection: A Comparative Analysis of Video-Based Emotion Foundation Models},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {10874--10882},
}
Evaluating Web-trained Facial Expression Recognition in Naturalistic Collaborative Learning
[pdf]
[supp]
[bibtex]@InProceedings{Anindho_2026_CVPR,
  author    = {Anindho, Sifatul and Venkatesha, Videep and Blanchard, Nathaniel},
  title     = {Evaluating Web-trained Facial Expression Recognition in Naturalistic Collaborative Learning},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {10789--10798},
}
InterventionLens: A Multi-Agent Framework for Detecting ASD Intervention Strategies in Parent-Child Shared Reading
[pdf]
[arXiv]
[bibtex]@InProceedings{Wang_2026_CVPR,
  author    = {Wang, Xiao and Dong, Lu and Nwogu, Ifeoma and Setlur, Srirangaraj and Govindaraju, Venu},
  title     = {{InterventionLens}: A Multi-Agent Framework for Detecting {ASD} Intervention Strategies in Parent-Child Shared Reading},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {10904--10911},
}
Cross-modal Affinity-aligned Multimodal Learning Analytics for Predicting Student Collaboration Satisfaction in Game-Based Learning
[pdf]
[arXiv]
[bibtex]@InProceedings{Tsai_2026_CVPR,
  author    = {Tsai, Wen-Hsin and Lee, Chia-Ming and Tung, Yuk-Ying},
  title     = {Cross-modal Affinity-aligned Multimodal Learning Analytics for Predicting Student Collaboration Satisfaction in Game-Based Learning},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {10893--10903},
}
Context Matters: Peer-Aware Student Behavioral Engagement Measurement via VLM Action Parsing and LLM Sequence Classification
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Abdelkawy_2026_CVPR,
  author    = {Abdelkawy, Ahmed and Elsayed, Ahmed and Ali, Asem and Farag, Aly and Tretter, Thomas and McIntyre, Michael},
  title     = {Context Matters: Peer-Aware Student Behavioral Engagement Measurement via {VLM} Action Parsing and {LLM} Sequence Classification},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {10779--10788},
}
CSU101: An Educational Dataset for Introductory Computer Vision
[pdf]
[bibtex]@InProceedings{Seefried_2026_CVPR,
  author    = {Seefried, Ethan and Jung, Changsoo and Venkatesha, Videep and Chartier, Trevor and Christian, Caleb and Fitzgerald, Jack and Bradford, Mariah and Anindho, Sifatul and Sturgeon, Matthew and Blanchard, Nathaniel},
  title     = {{CSU101}: An Educational Dataset for Introductory Computer Vision},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {10864--10873},
}
Speech-Synchronized Whiteboard Generation via VLM-Driven Structured Drawing Representations
[pdf]
[arXiv]
[bibtex]@InProceedings{Prasad_2026_CVPR,
  author    = {Prasad, Suraj and Mahapatra, Pinak},
  title     = {Speech-Synchronized Whiteboard Generation via {VLM}-Driven Structured Drawing Representations},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {10859--10863},
}
VLMath: A Multimodal Vision-Language System for Pedagogically Aligned Math Tutoring
[pdf]
[supp]
[bibtex]@InProceedings{Ardakani_2026_CVPR,
  author    = {Ardakani, Mahsa and Eslami, Arshia and Zand, Ramtin},
  title     = {{VLMath}: A Multimodal Vision-Language System for Pedagogically Aligned Math Tutoring},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {10799--10809},
}
AI-Assisted Competency Assessment from Egocentric Video in Simulation-Based Nursing Education
[pdf]
[supp]
[bibtex]@InProceedings{Wang_2026_CVPR_b,
  author    = {Wang, Hanchen David and Liu, Yilin and Mason, Madison J. and Rayala, Surya Chand and Biswas, Gautam and Levin, Daniel T. and Ma, Meiyi},
  title     = {{AI}-Assisted Competency Assessment from Egocentric Video in Simulation-Based Nursing Education},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {10912--10921},
}
% Key carries a "_b" suffix: Wang_2026_CVPR is already used by the InterventionLens entry earlier in this listing, and a repeated key makes the later entry unreachable.
MES-Bench: A Benchmark for Multimodal Elaborative Simplification and Comprehensibility Evaluation in Language Learning
[pdf]
[bibtex]@InProceedings{Gruszka_2026_CVPR,
  author    = {Gruszka, Martyna and Shinoda, Risa and Miyanishi, Taiki and Hirose, Takumi and Inoue, Nakamasa},
  title     = {{MES-Bench}: A Benchmark for Multimodal Elaborative Simplification and Comprehensibility Evaluation in Language Learning},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {10820--10829},
}
ReSoFed: Reliability-Guided Model Souping for Robust Federated Learning in Heterogeneous Classroom Environments
[pdf]
[bibtex]@InProceedings{Kabir_2026_CVPR,
  author    = {Kabir, Muhammad Rafsan and Shopon, Md and Gavrilova, Marina L.},
  title     = {{ReSoFed}: Reliability-Guided Model Souping for Robust Federated Learning in Heterogeneous Classroom Environments},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {10839--10848},
}
Delta-Gated Incremental Multi-Forward-Pass Modeling for Robust Multimodal Classroom Video Understanding
[pdf]
[bibtex]@InProceedings{He_2026_CVPR,
  author    = {He, Chongyu and Youngs, Peter and Acton, Scott},
  title     = {Delta-Gated Incremental Multi-Forward-Pass Modeling for Robust Multimodal Classroom Video Understanding},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {10830--10838},
}
Sequence-Based Identification of First-Person Camera Wearers in Third-Person Views
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Zhao_2026_CVPR,
  author    = {Zhao, Ziwei and Wang, Xizi and Wang, Yuchen and Cheng, Feng and Crandall, David},
  title     = {Sequence-Based Identification of First-Person Camera Wearers in Third-Person Views},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {10932--10943},
}
Do Emotion Recognition Models Generalize to Classrooms? Robustness and Fairness Analysis
[pdf]
[bibtex]@InProceedings{S_2026_CVPR,
  author    = {S, Ashwin T. and Prasanna, Srigowri Mayasandra and Fonteles, Joyce Horn and Biswas, Gautam},
  title     = {Do Emotion Recognition Models Generalize to Classrooms? Robustness and Fairness Analysis},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {10883--10892},
}
ConfusionBench: An Expert-Validated Benchmark for Confusion Recognition and Localization in Educational Videos
[pdf]
[arXiv]
[bibtex]@InProceedings{Dong_2026_CVPR,
  author    = {Dong, Lu and Wang, Xiao and Frank, Mark and Setlur, Srirangaraj and Govindaraju, Venu and Nwogu, Ifeoma},
  title     = {{ConfusionBench}: An Expert-Validated Benchmark for Confusion Recognition and Localization in Educational Videos},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {10810--10819},
}
Diagnosis of Human-Object Interaction Detectors for Real-World Educational Applications
[pdf]
[supp]
[bibtex]@InProceedings{Mereddy_2026_CVPR,
  author    = {Mereddy, Divya and Sadashiva, Ashwin Tudur and Quinones-Grueiro, Marcos and Biswas, Gautam},
  title     = {Diagnosis of Human-Object Interaction Detectors for Real-World Educational Applications},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {10849--10858},
}

