# Create a reproducible sample dataset of 1000 rows.
# The RNG is re-seeded with the same value before every random column, so each
# column can be regenerated on its own without replaying the earlier draws.

# id: five distinct random lowercase letters followed by the row number.
# vapply() pins the result to one string per row (sapply() would silently
# change its return type on unexpected input).
set.seed(123L)
id <- vapply(
  seq_len(1000L),
  function(x) paste(c(sample(letters, 5), x), collapse = ""),
  character(1)
)
# year: a single constant string, recycled to every row by data.frame()
year <- "2018"
# count: integers drawn from 1..10 with replacement
set.seed(123L)
count <- sample(1:10, size = 1000, replace = TRUE)
# alpha: lowercase letters drawn with replacement
set.seed(123L)
alpha <- sample(letters, size = 1000, replace = TRUE)
# flag: "Y" with probability 0.1, "N" with probability 0.9
set.seed(123L)
flag <- sample(c("Y", "N"), size = 1000, prob = c(0.1, 0.9), replace = TRUE)
# Assemble the columns; character columns stay character (not factor)
dat <- data.frame(id, year, count, alpha, flag, stringsAsFactors = FALSE)
# Inspect the structure of the raw dataset before any cleansing
str(dat)
# Scenario 1: cleanse with every option left at its default
newDat <- cleanse(dat)
# Inspect the structure of the cleansed dataset
str(newDat)
# Scenario 2: cleanse with uniq = FALSE (newDat is overwritten on each run)
# NOTE(review): presumably disables a uniqueness-based column check; confirm in the cleanse() docs
newDat <- cleanse(dat, uniq = FALSE)
# Inspect the structure of the cleansed dataset
str(newDat)
# Scenario 3: cleanse with uniq_thres = 0.3
# NOTE(review): presumably a threshold for the uniqueness check; confirm in the cleanse() docs
newDat <- cleanse(dat, uniq_thres = 0.3)
# Inspect the structure of the cleansed dataset
str(newDat)
# Scenario 4: cleanse with char = FALSE
# NOTE(review): presumably disables special handling of character columns; confirm in the cleanse() docs
newDat <- cleanse(dat, char = FALSE)
# Inspect the structure of the cleansed dataset
str(newDat)
# Run the code above in your browser using DataLab