# Three short example documents, keyed by the ids "A", "B" and "C".
# The line breaks inside the first and third string are part of the text.
texts <- list(
  A = "Give a Man a Fish, and You Feed Him for a Day.
Teach a Man To Fish, and You Feed Him for a Lifetime",
  B = "So Long, and Thanks for All the Fish",
  C = "A very able manipulative mathematician, Fisher enjoys a real mastery
in evaluating complicated multiple integrals."
)

# Metadata table with one row per id. It lists four ids ("A" to "D") while
# `texts` holds only three elements, so id "D" has no matching text.
corpus_meta <- data.frame(
  id = c("A", "B", "C", "D"),
  title = c("Fishing", "Don't panic!", "Sir Ronald", "Berlin"),
  date = c("1885-01-02", "1979-03-04", "1951-05-06", "1967-06-02"),
  additionalVariable = 1:4,
  stringsAsFactors = FALSE
)

# Combine metadata and texts into one corpus object, then pass it through
# cleanTexts() (presumably text normalisation -- confirm in the package docs).
corpus <- textmeta(meta = corpus_meta, text = texts)
corpus <- cleanTexts(corpus)

# Derive the word list from the cleaned texts; its `words` element is used as
# the vocabulary for both the LDA preparation step and the model call below.
wordlist <- makeWordlist(corpus$text)
ldaPrep <- LDAprep(
  text = corpus$text,
  vocab = wordlist$words
)

# Generate the LDA result with K = 3 topics and num.words = 3.
LDA <- LDAgen(
  documents = ldaPrep,
  K = 3L,
  vocab = wordlist$words,
  num.words = 3
)

# Inspect the `topics` element of the result with both helper functions.
topWords(LDA$topics)
importance(LDA$topics)
# Run the code above in your browser using DataLab