Text and Documents in the Deep Learning Era


A Method for Detecting Text of Arbitrary Shapes in Natural Scenes That Improves Text Spotting
Qitong Wang,
Yi Zheng,
Margrit Betke
[pdf]
[bibtex]
@InProceedings{Wang_2020_CVPR_Workshops,
  author    = {Wang, Qitong and Zheng, Yi and Betke, Margrit},
  title     = {A Method for Detecting Text of Arbitrary Shapes in Natural Scenes That Improves Text Spotting},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2020},
}

Textual Visual Semantic Dataset for Text Spotting
Ahmed Sabir,
Francesc Moreno-Noguer,
Lluis Padro
[pdf]
[bibtex]
@InProceedings{Sabir_2020_CVPR_Workshops,
  author    = {Sabir, Ahmed and Moreno-Noguer, Francesc and Padro, Lluis},
  title     = {Textual Visual Semantic Dataset for Text Spotting},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2020},
}

READ: Recursive Autoencoders for Document Layout Generation
Akshay Gadi Patil,
Omri Ben-Eliezer,
Or Perel,
Hadar Averbuch-Elor
[pdf]
[bibtex]
@InProceedings{Patil_2020_CVPR_Workshops,
  author    = {Patil, Akshay Gadi and Ben-Eliezer, Omri and Perel, Or and Averbuch-Elor, Hadar},
  title     = {{READ}: Recursive Autoencoders for Document Layout Generation},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2020},
}

On Recognizing Texts of Arbitrary Shapes With 2D Self-Attention
Junyeop Lee,
Sungrae Park,
Jeonghun Baek,
Seong Joon Oh,
Seonghyeon Kim,
Hwalsuk Lee
[pdf]
[bibtex]
@InProceedings{Lee_2020_CVPR_Workshops,
  author    = {Lee, Junyeop and Park, Sungrae and Baek, Jeonghun and Oh, Seong Joon and Kim, Seonghyeon and Lee, Hwalsuk},
  title     = {On Recognizing Texts of Arbitrary Shapes With {2D} Self-Attention},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2020},
}

A Large Dataset of Historical Japanese Documents With Complex Layouts
Zejiang Shen,
Kaixuan Zhang,
Melissa Dell
[pdf]
[bibtex]
@InProceedings{Shen_2020_CVPR_Workshops,
  author    = {Shen, Zejiang and Zhang, Kaixuan and Dell, Melissa},
  title     = {A Large Dataset of Historical {Japanese} Documents With Complex Layouts},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2020},
}

An Accurate Segmentation-Based Scene Text Detector With Context Attention and Repulsive Text Border
Xi Liu,
Gaojing Zhou,
Rui Zhang,
Xiaolin Wei
[pdf]
[bibtex]
@InProceedings{Liu_2020_CVPR_Workshops,
  author    = {Liu, Xi and Zhou, Gaojing and Zhang, Rui and Wei, Xiaolin},
  title     = {An Accurate Segmentation-Based Scene Text Detector With Context Attention and Repulsive Text Border},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2020},
}

Illegible Text to Readable Text: An Image-to-Image Transformation Using Conditional Sliced Wasserstein Adversarial Networks
Mostafa Karimi,
Gopalkrishna Veni,
Yen-Yun Yu
[pdf] [supp]
[bibtex]
@InProceedings{Karimi_2020_CVPR_Workshops,
  author    = {Karimi, Mostafa and Veni, Gopalkrishna and Yu, Yen-Yun},
  title     = {Illegible Text to Readable Text: An Image-to-Image Transformation Using Conditional Sliced {Wasserstein} Adversarial Networks},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2020},
}

Optical Braille Recognition Based on Semantic Segmentation Network With Auxiliary Learning Strategy
Renqiang Li,
Hong Liu,
Xiangdong Wang,
Jianxing Xu,
Yueliang Qian
[pdf]
[bibtex]
@InProceedings{Li_2020_CVPR_Workshops,
  author    = {Li, Renqiang and Liu, Hong and Wang, Xiangdong and Xu, Jianxing and Qian, Yueliang},
  title     = {Optical {Braille} Recognition Based on Semantic Segmentation Network With Auxiliary Learning Strategy},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2020},
}

Font-ProtoNet: Prototypical Network-Based Font Identification of Document Images in Low Data Regime
Nikita Goel,
Monika Sharma,
Lovekesh Vig
[pdf]
[bibtex]
@InProceedings{Goel_2020_CVPR_Workshops,
  author    = {Goel, Nikita and Sharma, Monika and Vig, Lovekesh},
  title     = {{Font-ProtoNet}: Prototypical Network-Based Font Identification of Document Images in Low Data Regime},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2020},
}

Information Extraction From Document Images via FCA-Based Template Detection and Knowledge Graph Rule Induction
Mouli Rastogi,
Syed Afshan Ali,
Mrinal Rawat,
Lovekesh Vig,
Puneet Agarwal,
Gautam Shroff,
Ashwin Srinivasan
[pdf]
[bibtex]
@InProceedings{Rastogi_2020_CVPR_Workshops,
  author    = {Rastogi, Mouli and Ali, Syed Afshan and Rawat, Mrinal and Vig, Lovekesh and Agarwal, Puneet and Shroff, Gautam and Srinivasan, Ashwin},
  title     = {Information Extraction From Document Images via {FCA}-Based Template Detection and Knowledge Graph Rule Induction},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2020},
}

An OCR for Classical Indic Documents Containing Arbitrarily Long Words
Agam Dwivedi,
Rohit Saluja,
Ravi Kiran Sarvadevabhatla
[pdf]
[bibtex]
@InProceedings{Dwivedi_2020_CVPR_Workshops,
  author    = {Dwivedi, Agam and Saluja, Rohit and Sarvadevabhatla, Ravi Kiran},
  title     = {An {OCR} for Classical {Indic} Documents Containing Arbitrarily Long Words},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2020},
}

Visual and Textual Deep Feature Fusion for Document Image Classification
Souhail Bakkali,
Zuheng Ming,
Mickael Coustaty,
Marcal Rusinol
[pdf]
[bibtex]
@InProceedings{Bakkali_2020_CVPR_Workshops,
  author    = {Bakkali, Souhail and Ming, Zuheng and Coustaty, Mickael and Rusinol, Marcal},
  title     = {Visual and Textual Deep Feature Fusion for Document Image Classification},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2020},
}

CLEval: Character-Level Evaluation for Text Detection and Recognition Tasks
Youngmin Baek,
Daehyun Nam,
Sungrae Park,
Junyeop Lee,
Seung Shin,
Jeonghun Baek,
Chae Young Lee,
Hwalsuk Lee
[pdf] [supp]
[bibtex]
@InProceedings{Baek_2020_CVPR_Workshops,
  author    = {Baek, Youngmin and Nam, Daehyun and Park, Sungrae and Lee, Junyeop and Shin, Seung and Baek, Jeonghun and Lee, Chae Young and Lee, Hwalsuk},
  title     = {{CLEval}: Character-Level Evaluation for Text Detection and Recognition Tasks},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2020},
}

Recognizing Handwritten Mathematical Expressions via Paired Dual Loss Attention Network and Printed Mathematical Expressions
Anh Duc Le
[pdf]
[bibtex]
@InProceedings{Le_2020_CVPR_Workshops,
  author    = {Le, Anh Duc},
  title     = {Recognizing Handwritten Mathematical Expressions via Paired Dual Loss Attention Network and Printed Mathematical Expressions},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2020},
}

Symbol Spotting on Digital Architectural Floor Plans Using a Deep Learning-Based Framework
Alireza Rezvanifar,
Melissa Cote,
Alexandra Branzan Albu
[pdf]
[bibtex]
@InProceedings{Rezvanifar_2020_CVPR_Workshops,
  author    = {Rezvanifar, Alireza and Cote, Melissa and Albu, Alexandra Branzan},
  title     = {Symbol Spotting on Digital Architectural Floor Plans Using a Deep Learning-Based Framework},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2020},
}

Visual Parsing With Query-Driven Global Graph Attention (QD-GGA): Preliminary Results for Handwritten Math Formula Recognition
Mahshad Mahdavi,
Richard Zanibbi
[pdf]
[bibtex]
@InProceedings{Mahdavi_2020_CVPR_Workshops,
  author    = {Mahdavi, Mahshad and Zanibbi, Richard},
  title     = {Visual Parsing With Query-Driven Global Graph Attention ({QD-GGA}): Preliminary Results for Handwritten Math Formula Recognition},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2020},
}

CascadeTabNet: An Approach for End to End Table Detection and Structure Recognition From Image-Based Documents
Devashish Prasad,
Ayan Gadpal,
Kshitij Kapadni,
Manish Visave,
Kavita Sultanpure
[pdf] [supp]
[bibtex]
@InProceedings{Prasad_2020_CVPR_Workshops,
  author    = {Prasad, Devashish and Gadpal, Ayan and Kapadni, Kshitij and Visave, Manish and Sultanpure, Kavita},
  title     = {{CascadeTabNet}: An Approach for End to End Table Detection and Structure Recognition From Image-Based Documents},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2020},
}