# Load example dataset
data("Data_HC_contamination", package = "dbrobust")
df <- Data_HC_contamination
# --- Quick Example ---
numeric_data <- df[1:10, 1:4] # subset for speed
d_euclid <- calculate_distances(
numeric_data,
method = "euclidean",
output_format = "matrix"
)
# \donttest{
# Load example dataset
data("Data_HC_contamination", package = "dbrobust")
df <- Data_HC_contamination[1:20,]
# Example 1: Euclidean distance (numeric variables only)
numeric_data <- df[, 1:4]
d_euclid <- calculate_distances(
numeric_data,
method = "euclidean",
output_format = "matrix"
)
# Example 2: Manhattan distance
d_manhattan <- calculate_distances(
numeric_data,
method = "manhattan",
output_format = "matrix"
)
# Example 3: Categorical distance using Matching Coefficient
categorical_data <- df[, 5:7]
d_match <- calculate_distances(
categorical_data,
method = "matching_coefficient",
output_format = "matrix"
)
# Example 4: Mixed data distance using Gower (automatic type detection, asymmetric binary)
d_gower_asym <- calculate_distances(
df,
method = "gower",
output_format = "dist",
binary_asym = TRUE
)
# Example 5: Minkowski distance with p = 3
d_minkowski <- calculate_distances(
numeric_data,
method = "minkowski",
p = 3,
output_format = "matrix"
)
# Example 6: Jaccard distance for binary variables
binary_data <- df[, 8:9]
d_jaccard <- calculate_distances(
binary_data,
method = "jaccard",
output_format = "matrix"
)
# Example 7: Mahalanobis distance
d_mahal <- calculate_distances(
numeric_data,
method = "mahalanobis",
output_format = "matrix"
)
# Example 8: Manual selection of variables for Gower distance
continuous_vars <- 1:4
binary_vars <- 8:9
categorical_vars <- 5:7
d_gower_manual <- calculate_distances(
df,
method = "gower",
output_format = "dist",
continuous_cols = continuous_vars,
binary_cols = binary_vars,
categorical_cols = categorical_vars
)
# }
Run the code above in your browser using DataLab