9th Multimodal Learning and Applications Workshop
Responses Fall Short of Understanding: Revealing the Gap between Internal Representations and Responses in Visual Document Understanding
[pdf]
[arXiv]
[bibtex]
@InProceedings{Kawasaki_2026_CVPR,
  author    = {Kawasaki, Haruka and Tanaka, Ryota and Nishida, Kyosuke},
  title     = {Responses Fall Short of Understanding: Revealing the Gap between Internal Representations and Responses in Visual Document Understanding},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {7483--7493}
}

