# Feature selection on Palmer Penguins data set
# \donttest{
task = tsk("penguins")
learner = lrn("classif.rpart")
# Construct feature selection instance
instance = fsi(
task = task,
learner = learner,
resampling = rsmp("cv", folds = 3),
measures = msr("classif.ce"),
terminator = trm("evals", n_evals = 4)
)
# Choose optimization algorithm
fselector = fs("random_search", batch_size = 2)
# Run feature selection
fselector$optimize(instance)
# Subset task to optimal feature set
task$select(instance$result_feature_set)
# Train the learner with optimal feature set on the full data set
learner$train(task)
# Inspect all evaluated sets
as.data.table(instance$archive)
# }
Run the code above in your browser using DataLab