# Build a corpus directly from a vector of texts (auto-printed at top level).
corpus(inaugTexts)

# Build a corpus from texts, attaching a document variable ("party", taken
# from the names of the text vector) and requesting a target encoding.
ukimmigCorpus <- corpus(
  ukimmigTexts,
  docvars = data.frame(party = names(ukimmigTexts)),
  encTo = "UTF-16"
)

# Pull the texts back out of an existing object and build a corpus from them.
corpus(texts(ie2010Corpus))

# Read a remote csv file; the text field is selected by position here
# (the fifth column of this csv file is the text field).
mytexts <- textfile(
  "http://www.kenbenoit.net/files/text_example.csv",
  textField = 5
)
mycorp <- corpus(mytexts)

# Same file again, this time selecting the text field by column name.
mycorp2 <- corpus(
  textfile(
    "http://www.kenbenoit.net/files/text_example.csv",
    textField = "Title"
  )
)

# Compare the two corpora: texts first, then document variables.
identical(texts(mycorp), texts(mycorp2))
identical(docvars(mycorp), docvars(mycorp2))
# Import a tm VCorpus.
# The example only runs when the optional "tm" package can actually be loaded.
# requireNamespace() is the recommended availability check: scanning
# installed.packages() is slow and does not confirm the package is usable.
if (requireNamespace("tm", quietly = TRUE)) {
  # Load a tm example VCorpus and convert it.
  data(crude, package = "tm")
  mytmCorpus <- corpus(crude)
  summary(mytmCorpus, showmeta = TRUE)

  # A second tm example dataset, converted inline; the positional 5 is
  # passed as summary()'s second argument (presumably a document limit --
  # confirm against the summary method's signature).
  data(acq, package = "tm")
  summary(corpus(acq), 5, showmeta = TRUE)

  # Build a VCorpus from a subset of the texts, then convert it back.
  tmCorp <- tm::VCorpus(tm::VectorSource(inaugTexts[49:57]))
  quantCorp <- corpus(tmCorp)
  summary(quantCorp)
}
# Run the code above in your browser using DataLab