# Data stream made of three Gaussian clusters in a 3-dimensional data space.
stream1 <- DSD_Gaussians(k = 3, d = 3)
plot(stream1)
# Data stream with two clusters at explicitly chosen positions (mu).
# 20% of the points are noise inside the bounding box given by noise_range,
# and the clusters have unequal densities (p = 0.1 vs. 0.9, i.e. 1 to 9).
stream2 <- DSD_Gaussians(
  k = 2,
  d = 2,
  mu = rbind(c(-0.5, -0.5), c(0.5, 0.5)),
  noise = 0.2,
  noise_range = rbind(c(-1, 1), c(-1, 1)),
  p = c(0.1, 0.9)
)
plot(stream2)
# Two clusters plus two outliers. Clusters and outliers are kept apart by a
# Euclidean distance of at least 0.5.
stream3 <- DSD_Gaussians(
  k = 2,
  d = 2,
  separation_type = "Euclidean",
  separation = 0.5,
  space_limit = c(0, 1),
  outliers = 2
)
plot(stream3)
# Two clusters plus two outliers, this time kept apart by a Mahalanobis
# distance of at least 6.
stream4 <- DSD_Gaussians(
  k = 2,
  d = 2,
  separation_type = "Mahalanobis",
  separation = 6,
  space_limit = c(0, 25),
  variance_limit = 2,
  outliers = 2
)
plot(stream4)
# Twenty outliers spread over a horizon of 20000 data instances; the plot
# draws the same number of points.
stream5 <- DSD_Gaussians(
  k = 2,
  d = 2,
  separation_type = "Mahalanobis",
  separation = 6,
  space_limit = c(0, 45),
  variance_limit = 2,
  outliers = 20,
  outlier_options = list(
    outlier_horizon = 20000,
    outlier_virtual_variance = 0.3
  )
)
plot(stream5, n = 20000)
# Run the code above in your browser using DataLab