# Example setup: keep only the first five documents of the inaugural corpus
corp <- data_corpus_inaugural[1:5]

# Lookup table keyed by document name; it lists three document names
doc_data <- data.frame(
  docname = c("1789-Washington", "1793-Washington", "1797-Adams"),
  century = rep(18, 3),
  speech_number = c(1, 2, 1)
)

# Join on "docname": docnames(corp) is matched against doc_data$docname
summary(left_join(corp, doc_data, by = "docname"))
# When the key column has a different name in the lookup table, pass a named
# vector to `by`: the name is the corpus-side key, the value the table column
doc_data2 <- data.frame(
  doc_id = c("1789-Washington", "1793-Washington"),
  rating = c(5, 4)
)

summary(left_join(corp, doc_data2, by = c("docname" = "doc_id")))
# Ordinary join keyed on a docvar the corpus already has ("Year")
year_info <- data.frame(
  Year = c(1789, 1793, 1797, 1801, 1805),
  decade = c("1780s", "1790s", "1790s", "1800s", "1800s")
)

summary(left_join(corp, year_info, by = "Year"))
# Run the code above in your browser using DataLab