# English sample document ----
# Locate the sample PDF installed with the orderanalyzer package and
# extract its text.
file <- system.file(
  "extdata", "OrderDocument_en.pdf",
  package = "orderanalyzer"
)
text <- extractText(file)

# Variant 1: call extractTables() with the text only.
tables <- extractTables(text)
tables[[1]]$data

# Variant 2: additionally pass a list of entity names. Each character
# vector is converted to UTF-8 via enc2utf8() before it is handed over
# (note the escaped euro sign "\u20AC" among the currency units).
entity_names <- list(
  currencyUnits = enc2utf8(c("eur", "euro", "\u20AC")),
  quantityUnits = enc2utf8(c("pcs", "pcs.")),
  headerNames = enc2utf8(c("pos", "item", "quantity")),
  noTableNames = enc2utf8(c("order total", "supplier number"))
)
tables <- extractTables(text, entityNames = entity_names)
tables[[1]]$data

# German sample document ----
# Same workflow as variant 1, applied to the German sample PDF.
file <- system.file(
  "extdata", "OrderDocument_de.pdf",
  package = "orderanalyzer"
)
text <- extractText(file)
tables <- extractTables(text)
tables[[1]]$data
# Run the code above in your browser using DataLab