added gitignore & tidyr
This commit is contained in:
parent
852e549f70
commit
0ff660598a
|
@@ -0,0 +1,7 @@
|
|||
.Rproj.user
|
||||
.Rhistory
|
||||
.RData
|
||||
.Ruserdata
|
||||
|
||||
*.jpg
|
||||
*.csv
|
|
@@ -0,0 +1,13 @@
|
|||
Version: 1.0
|
||||
|
||||
RestoreWorkspace: Default
|
||||
SaveWorkspace: Default
|
||||
AlwaysSaveHistory: Default
|
||||
|
||||
EnableCodeIndexing: Yes
|
||||
UseSpacesForTab: Yes
|
||||
NumSpacesForTab: 2
|
||||
Encoding: UTF-8
|
||||
|
||||
RnwWeave: Sweave
|
||||
LaTeX: pdfLaTeX
|
|
@@ -3,7 +3,7 @@
|
|||
# (c) 2019 The Field Museum - MIT License (https://opensource.org/licenses/MIT)
|
||||
# https://github.com/fieldmuseum/Collections-OCR
|
||||
|
||||
|
||||
library(tidyr)
|
||||
library(magick)
|
||||
library(stringr)
|
||||
library(tesseract)
|
||||
|
@@ -53,6 +53,7 @@ ocrText <- separate(imagesOCR, text,
|
|||
sep = "\n",
|
||||
extra = "merge", fill = "right")
|
||||
|
||||
|
||||
# export CSV
|
||||
write.csv(ocrText,
|
||||
paste0("ocrText-",
|
||||
|
|
Loading…
Reference in New Issue