-
Notifications
You must be signed in to change notification settings - Fork 4
/
paper.bib
81 lines (72 loc) · 2.36 KB
/
paper.bib
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
% Amazon Textract web page, cited with Amazon as a corporate author.
% The author is double-braced so it is treated as one indivisible name.
@misc{amazon:2021,
  author = {{Amazon}},
  title  = {{Amazon Textract: Easily extract printed text, handwriting, and data from virtually any document}},
  year   = {2021},
  url    = {https://aws.amazon.com/textract/},
}
% googleLanguageR R package on CRAN, version 0.3.0.
% The title carries the package name exactly as it appears in the CRAN URL.
@misc{edmondson:2020,
  author = {{Edmondson}, M.},
  title  = {{googleLanguageR: Call Google's 'Natural Language' API, 'Cloud Translation' API, 'Cloud Speech' API and 'Cloud Text-to-Speech' API}},
  year   = 2020,
  note   = {R package version 0.3.0},
  url    = {https://cran.r-project.org/package=googleLanguageR},
}
% googleCloudStorageR R package on CRAN, version 0.6.0.
@misc{edmondson:2021,
  author = {{Edmondson}, M.},
  title  = {{googleCloudStorageR: Interface with Google Cloud Storage API}},
  note   = {R package version 0.6.0},
  url    = {https://cran.r-project.org/package=googleCloudStorageR},
  year   = {2021},
}
% daiR R package on CRAN (no version recorded in this entry).
@misc{hegghammer:2021,
  author = {{Hegghammer}, T.},
  title  = {{daiR: An R package for OCR in Google Document AI}},
  year   = {2021},
  url    = {https://cran.r-project.org/package=daiR},
}
% OCR benchmarking preprint hosted on SocArXiv (DOI prefix 10.31235/osf.io).
% The journal field spells the server name with its own capitalisation, and
% the month uses the standard lowercase three-letter macro.
@article{hegghammer:2021b,
  author  = {{Hegghammer}, T.},
  title   = {{OCR with Tesseract, Amazon Textract, and Google Document AI: A Benchmarking Experiment}},
  journal = {SocArXiv},
  year    = 2021,
  month   = jun,
  doi     = {10.31235/osf.io/6zfvs},
  url     = {https://osf.io/preprints/socarxiv/6zfvs},
}
% paws R package on CRAN, version 0.1.11.
% NOTE(review): first author initial set to D. (David Kretch per the CRAN
% package listing); confirm against the package DESCRIPTION file.
@misc{kretch:2021,
  author = {{Kretch}, D. and {Banker}, A.},
  title  = {{paws: Amazon Web Services Software Development Kit}},
  year   = 2021,
  note   = {R package version 0.1.11},
  url    = {https://cran.r-project.org/package=paws},
}
% tesseract R package on CRAN, version 4.1.1.
% The URL uses the same canonical CRAN package form as the other R package
% entries in this file, rather than a mirror-specific index.html path.
@misc{ooms:2021,
  author = {{Ooms}, J.},
  title  = {{tesseract: Open Source OCR Engine}},
  year   = 2021,
  note   = {R package version 4.1.1},
  url    = {https://cran.r-project.org/package=tesseract},
}
% Workshop paper on OCR evaluation tools.
% Initials are space-separated so BibTeX parses them as two given-name
% tokens; glued initials are read as a single token and abbreviate wrongly.
@inproceedings{santos:2019,
  author    = {{Santos}, E. A.},
  title     = {{OCR evaluation tools for the 21st century}},
  booktitle = {Proceedings of the Workshop on Computational Methods for Endangered Languages},
  volume    = 1,
  year      = 2019,
  doi       = {10.33011/computel.v1i.345},
}
% Tesseract OCR engine source repository on GitHub.
% OCR is brace-protected so sentence-casing styles keep the acronym in
% capitals. The repository description sits in howpublished, a field that
% misc entries print; the journal field is not used by misc in standard styles.
@misc{tesseract:2021,
  author       = {{Tesseract}},
  title        = {Tesseract {OCR}},
  howpublished = {GitHub repository},
  publisher    = {GitHub},
  year         = 2021,
  url          = {https://github.com/tesseract-ocr/tesseract},
}
% Google Cloud Blog post on DocAI general availability.
% The month field concatenates the month macro with a tie and the day
% number, the usual BibTeX way to carry a day-of-month.
@article{vanguri:2021,
  author  = {{Vanguri}, S.},
  title   = {{Customers cut document processing time and costs with DocAI solutions, now generally available}},
  journal = {Google Cloud Blog},
  month   = Apr # "~21",
  year    = {2021},
}