9th Multimodal Learning and Applications Workshop


Responses Fall Short of Understanding: Revealing the Gap between Internal Representations and Responses in Visual Document Understanding
Haruka Kawasaki,
Ryota Tanaka,
Kyosuke Nishida
[pdf] [arXiv]
[bibtex]
@comment{Workshop paper in the CVPR 2026 Workshops proceedings. The month uses the predefined jun macro and the page range uses a double hyphen so that bibliography styles can format both.}
@inproceedings{Kawasaki_2026_CVPR,
  author    = {Kawasaki, Haruka and Tanaka, Ryota and Nishida, Kyosuke},
  title     = {Responses Fall Short of Understanding: Revealing the Gap between Internal Representations and Responses in Visual Document Understanding},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {7483--7493},
}