# Example: per-document token counts fed into `bind_tf_idf2()`.
# Guarded by `if (FALSE)`, so nothing below runs when the file is sourced.
if (FALSE) {
  # Elements 5 through 8 of `ginga` are used as the input texts
  # (presumably `ginga` is a character vector of sentences -- confirm).
  idx <- 5:8
  corpus <- data.frame(
    doc_id = seq_along(idx), # documents are numbered 1..4, not 5..8
    text = ginga[idx]
  )

  # Tokenize the corpus; the result is expected to carry `doc_id` and
  # `token` columns, since both are referenced below.
  tokens <- tokenize(corpus)

  # Count how often each token occurs within each document, then drop the
  # grouping so downstream steps receive an ungrouped table.
  df <- tokens |>
    dplyr::group_by(doc_id) |>
    dplyr::count(token) |>
    dplyr::ungroup()

  # Show the first rows of the result of `bind_tf_idf2()` on the counts.
  weighted <- bind_tf_idf2(df)
  head(weighted)
}
# Run the code above in your browser using DataLab