# Example: wrap a sentence in a text object via corp_text() and inspect it
# with the accessor functions. Lines starting with `##` are the printed
# output of the call directly above them.
phrase <- "A man, a plan, a canal -- Panama!"
phrase_text <- corp_text(phrase)

# Token table, one row per word. In the output shown here, `type` is the
# lower-cased form of `token`, `start`/`end` are 1-based inclusive character
# positions in the original string, and punctuation produces no rows.
corp_get_tokens(phrase_text)
##      type start end  token idx
## 1:      a     1   1      A   1
## 2:    man     3   5    man   2
## 3:      a     8   8      a   3
## 4:   plan    10  13   plan   4
## 5:      a    16  16      a   5
## 6:  canal    18  22  canal   6
## 7: panama    27  32 Panama   7

# The original string is returned unchanged.
corp_get_text(phrase_text)
## [1] "A man, a plan, a canal -- Panama!"

# Lookup from each type to the distinct surface tokens it covers
# (here "A" and "a" both fall under type "a").
corp_type_lookup(phrase_text)
##      type tokens
## 1:      a   A, a
## 2:  canal  canal
## 3:    man    man
## 4: panama Panama
## 5:   plan   plan
# Run the code above in your browser using DataLab