# NOT RUN {
# }
# NOT RUN {
data(Titanic)
# Find frequencies in parallel
discparcoord(Titanic, inParallel=TRUE)
# }
# NOT RUN {
# }
# NOT RUN {
data(hrdata)
input1 = list("name" = "average_montly_hours",
"partitions" = 3, "labels" = c("low", "med", "high"))
input = list(input1)
# this will discretize the data by partitioning average monthly
# hours into 3 parts called low, med, and high
hrdata = discretize(hrdata, input)
print('first few discretized tuples')
# first line should be 0.38,0.53,2,low,3,0,1,00,sales,low
head(hrdata)
print('first few most-frequent tuples')
# first line should be 0.40,0.46,2,...,11
tupleFreqs(hrdata,saveCounts=FALSE)
# account for NA values and plot with parallel coordinates
discparcoord(hrdata)
# same as above, but with scrambled columns
discparcoord(hrdata, permute=TRUE)
# same as above, but show top k values
discparcoord(hrdata, k=8)
# same as above, but group according to profession
discparcoord(hrdata, grpcategory="sales")
# }
Run the code above in your browser using DataLab