-
Notifications
You must be signed in to change notification settings - Fork 2
/
CITATION.bib
18 lines (18 loc) · 1.52 KB
/
CITATION.bib
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
@inproceedings{10.1007/978-3-031-41734-4_26,
author = {Umer, Muhammad
and Mohsin, Muhammad Ahmed
and Ul-Hasan, Adnan
and Shafait, Faisal},
editor = {Fink, Gernot A.
and Jain, Rajiv
and Kise, Koichi
and Zanibbi, Richard},
title = {PyramidTabNet: Transformer-Based Table Recognition in Image-Based Documents},
booktitle = {Document Analysis and Recognition - ICDAR 2023},
year = {2023},
publisher = {Springer Nature Switzerland},
address = {Cham},
pages = {420--437},
abstract = {Table detection and structure recognition is an important component of document analysis systems. Deep learning-based transformer models have recently demonstrated significant success in various computer vision and document analysis tasks. In this paper, we introduce PyramidTabNet (PTN), a method that builds upon Convolution-less Pyramid Vision Transformer to detect tables in document images. Furthermore, we present a tabular image generative augmentation technique to effectively train the architecture. The proposed augmentation process consists of three steps, namely, clustering, fusion, and patching, for the generation of new document images containing tables. Our proposed pipeline demonstrates significant performance improvements for table detection on several standard datasets. Additionally, it achieves performance comparable to the state-of-the-art methods for structure recognition tasks.},
isbn = {978-3-031-41734-4}
}