CVPR 2020 Open Access Repository

Text and Documents in the Deep Learning Era

A Method for Detecting Text of Arbitrary Shapes in Natural Scenes That Improves Text Spotting: Qitong Wang,

Yi Zheng,

Margrit Betke; [pdf]
[bibtex]
@InProceedings{Wang_2020_CVPR_Workshops,
  author    = {Wang, Qitong and Zheng, Yi and Betke, Margrit},
  title     = {A Method for Detecting Text of Arbitrary Shapes in Natural Scenes That Improves Text Spotting},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2020},
}
Textual Visual Semantic Dataset for Text Spotting: Ahmed Sabir,

Francesc Moreno-Noguer,

Lluis Padro; [pdf]
[bibtex]
@InProceedings{Sabir_2020_CVPR_Workshops,
  author    = {Sabir, Ahmed and Moreno-Noguer, Francesc and Padro, Lluis},
  title     = {Textual Visual Semantic Dataset for Text Spotting},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2020},
}
READ: Recursive Autoencoders for Document Layout Generation: Akshay Gadi Patil,

Omri Ben-Eliezer,

Or Perel,

Hadar Averbuch-Elor; [pdf]
[bibtex]
@InProceedings{Patil_2020_CVPR_Workshops,
  author    = {Patil, Akshay Gadi and Ben-Eliezer, Omri and Perel, Or and Averbuch-Elor, Hadar},
  title     = {{READ}: Recursive Autoencoders for Document Layout Generation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2020},
}
On Recognizing Texts of Arbitrary Shapes With 2D Self-Attention: Junyeop Lee,

Sungrae Park,

Jeonghun Baek,

Seong Joon Oh,

Seonghyeon Kim,

Hwalsuk Lee; [pdf]
[bibtex]
@InProceedings{Lee_2020_CVPR_Workshops,
  author    = {Lee, Junyeop and Park, Sungrae and Baek, Jeonghun and Oh, Seong Joon and Kim, Seonghyeon and Lee, Hwalsuk},
  title     = {On Recognizing Texts of Arbitrary Shapes With {2D} Self-Attention},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2020},
}
A Large Dataset of Historical Japanese Documents With Complex Layouts: Zejiang Shen,

Kaixuan Zhang,

Melissa Dell; [pdf]
[bibtex]
@InProceedings{Shen_2020_CVPR_Workshops,
  author    = {Shen, Zejiang and Zhang, Kaixuan and Dell, Melissa},
  title     = {A Large Dataset of Historical {Japanese} Documents With Complex Layouts},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2020},
}
An Accurate Segmentation-Based Scene Text Detector With Context Attention and Repulsive Text Border: Xi Liu,

Gaojing Zhou,

Rui Zhang,

Xiaolin Wei; [pdf]
[bibtex]
@InProceedings{Liu_2020_CVPR_Workshops,
  author    = {Liu, Xi and Zhou, Gaojing and Zhang, Rui and Wei, Xiaolin},
  title     = {An Accurate Segmentation-Based Scene Text Detector With Context Attention and Repulsive Text Border},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2020},
}
Illegible Text to Readable Text: An Image-to-Image Transformation Using Conditional Sliced Wasserstein Adversarial Networks: Mostafa Karimi,

Gopalkrishna Veni,

Yen-Yun Yu; [pdf] [supp]
[bibtex]
@InProceedings{Karimi_2020_CVPR_Workshops,
  author    = {Karimi, Mostafa and Veni, Gopalkrishna and Yu, Yen-Yun},
  title     = {Illegible Text to Readable Text: An Image-to-Image Transformation Using Conditional Sliced {Wasserstein} Adversarial Networks},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2020},
}
Optical Braille Recognition Based on Semantic Segmentation Network With Auxiliary Learning Strategy: Renqiang Li,

Hong Liu,

Xiangdong Wang,

Jianxing Xu,

Yueliang Qian; [pdf]
[bibtex]
@InProceedings{Li_2020_CVPR_Workshops,
  author    = {Li, Renqiang and Liu, Hong and Wang, Xiangdong and Xu, Jianxing and Qian, Yueliang},
  title     = {Optical {Braille} Recognition Based on Semantic Segmentation Network With Auxiliary Learning Strategy},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2020},
}
Font-ProtoNet: Prototypical Network-Based Font Identification of Document Images in Low Data Regime: Nikita Goel,

Monika Sharma,

Lovekesh Vig; [pdf]
[bibtex]
@InProceedings{Goel_2020_CVPR_Workshops,
  author    = {Goel, Nikita and Sharma, Monika and Vig, Lovekesh},
  title     = {{Font-ProtoNet}: Prototypical Network-Based Font Identification of Document Images in Low Data Regime},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2020},
}
Information Extraction From Document Images via FCA-Based Template Detection and Knowledge Graph Rule Induction: Mouli Rastogi,

Syed Afshan Ali,

Mrinal Rawat,

Lovekesh Vig,

Puneet Agarwal,

Gautam Shroff,

Ashwin Srinivasan; [pdf]
[bibtex]
@InProceedings{Rastogi_2020_CVPR_Workshops,
  author    = {Rastogi, Mouli and Ali, Syed Afshan and Rawat, Mrinal and Vig, Lovekesh and Agarwal, Puneet and Shroff, Gautam and Srinivasan, Ashwin},
  title     = {Information Extraction From Document Images via {FCA}-Based Template Detection and Knowledge Graph Rule Induction},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2020},
}
An OCR for Classical Indic Documents Containing Arbitrarily Long Words: Agam Dwivedi,

Rohit Saluja,

Ravi Kiran Sarvadevabhatla; [pdf]
[bibtex]
@InProceedings{Dwivedi_2020_CVPR_Workshops,
  author    = {Dwivedi, Agam and Saluja, Rohit and Sarvadevabhatla, Ravi Kiran},
  title     = {An {OCR} for Classical {Indic} Documents Containing Arbitrarily Long Words},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2020},
}
Visual and Textual Deep Feature Fusion for Document Image Classification: Souhail Bakkali,

Zuheng Ming,

Mickael Coustaty,

Marcal Rusinol; [pdf]
[bibtex]
@InProceedings{Bakkali_2020_CVPR_Workshops,
  author    = {Bakkali, Souhail and Ming, Zuheng and Coustaty, Mickael and Rusinol, Marcal},
  title     = {Visual and Textual Deep Feature Fusion for Document Image Classification},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2020},
}
CLEval: Character-Level Evaluation for Text Detection and Recognition Tasks: Youngmin Baek,

Daehyun Nam,

Sungrae Park,

Junyeop Lee,

Seung Shin,

Jeonghun Baek,

Chae Young Lee,

Hwalsuk Lee; [pdf] [supp]
[bibtex]
@InProceedings{Baek_2020_CVPR_Workshops,
  author    = {Baek, Youngmin and Nam, Daehyun and Park, Sungrae and Lee, Junyeop and Shin, Seung and Baek, Jeonghun and Lee, Chae Young and Lee, Hwalsuk},
  title     = {{CLEval}: Character-Level Evaluation for Text Detection and Recognition Tasks},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2020},
}
Recognizing Handwritten Mathematical Expressions via Paired Dual Loss Attention Network and Printed Mathematical Expressions: Anh Duc Le; [pdf]
[bibtex]
@InProceedings{Le_2020_CVPR_Workshops,
  author    = {Le, Anh Duc},
  title     = {Recognizing Handwritten Mathematical Expressions via Paired Dual Loss Attention Network and Printed Mathematical Expressions},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2020},
}
Symbol Spotting on Digital Architectural Floor Plans Using a Deep Learning-Based Framework: Alireza Rezvanifar,

Melissa Cote,

Alexandra Branzan Albu; [pdf]
[bibtex]
@InProceedings{Rezvanifar_2020_CVPR_Workshops,
  author    = {Rezvanifar, Alireza and Cote, Melissa and Albu, Alexandra Branzan},
  title     = {Symbol Spotting on Digital Architectural Floor Plans Using a Deep Learning-Based Framework},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2020},
}
Visual Parsing With Query-Driven Global Graph Attention (QD-GGA): Preliminary Results for Handwritten Math Formula Recognition: Mahshad Mahdavi,

Richard Zanibbi; [pdf]
[bibtex]
@InProceedings{Mahdavi_2020_CVPR_Workshops,
  author    = {Mahdavi, Mahshad and Zanibbi, Richard},
  title     = {Visual Parsing With Query-Driven Global Graph Attention ({QD-GGA}): Preliminary Results for Handwritten Math Formula Recognition},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2020},
}
CascadeTabNet: An Approach for End to End Table Detection and Structure Recognition From Image-Based Documents: Devashish Prasad,

Ayan Gadpal,

Kshitij Kapadni,

Manish Visave,

Kavita Sultanpure; [pdf] [supp]
[bibtex]
@InProceedings{Prasad_2020_CVPR_Workshops,
  author    = {Prasad, Devashish and Gadpal, Ayan and Kapadni, Kshitij and Visave, Manish and Sultanpure, Kavita},
  title     = {{CascadeTabNet}: An Approach for End to End Table Detection and Structure Recognition From Image-Based Documents},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2020},
}