# NOT RUN {
# Basic usage: term statistics for a single text.
term_stats("A rose is a rose is a rose.")

# Pass a text filter that drops symbols (punctuation) and English stop words.
term_stats(
  "A rose is a rose is a rose.",
  filter = text_filter(drop_symbol = TRUE, drop = stopwords_en)
)

# Supply one weight per text (100 for the first, 1 for the second).
term_stats(
  c(
    "A rose is a rose is a rose.",
    "A Rose is red, a violet is blue!"
  ),
  weights = c(100, 1)
)

# Request n-grams of lengths 1 through 3 (unigrams, bigrams, and trigrams).
term_stats("A rose is a rose is a rose.", ngrams = 1:3)

# Same n-gram request, additionally including the type information.
term_stats("A rose is a rose is a rose.", ngrams = 1:3, types = TRUE)
# }
# Run the code above in your browser using DataLab