# Patch summary (text before the "diff --git" line is ignored by patch tools):
#   In the spark.lapply example, the SVM training over a grid of `cost` values
#   (which needed the e1071 package) is replaced by kmeans() clustering of the
#   four numeric iris columns with 3 centers, run once per algorithm name.
#   Each task now returns the model's within-cluster sum of squares
#   (model$withinss) instead of summary(model), and the result variable and
#   the comment above print() are renamed to match.
#   NOTE(review): kmeans() with `centers = 3` picks random starting centers,
#   so the printed values may differ between runs unless a seed is set --
#   confirm whether reproducible output matters for this example.
diff --git a/examples/src/main/r/ml/ml.R b/examples/src/main/r/ml/ml.R
index d601590c22a8945bba4cf634e97768eaf2f2ace6..05f5199aebe1572264f5f061fee04e3cf8a2811a 100644
--- a/examples/src/main/r/ml/ml.R
+++ b/examples/src/main/r/ml/ml.R
@@ -49,17 +49,16 @@ unlink(modelPath)
 ############################ fit models with spark.lapply #####################################
 
 # Perform distributed training of multiple models with spark.lapply
-costs <- exp(seq(from = log(1), to = log(1000), length.out = 5))
-train <- function(cost) {
-  stopifnot(requireNamespace("e1071", quietly = TRUE))
-  model <- e1071::svm(Species ~ ., data = iris, cost = cost)
-  summary(model)
+algorithms <- c("Hartigan-Wong", "Lloyd", "MacQueen")
+train <- function(algorithm) {
+  model <- kmeans(x = iris[1:4], centers = 3, algorithm = algorithm)
+  model$withinss
 }
 
-model.summaries <- spark.lapply(costs, train)
+model.withinss <- spark.lapply(algorithms, train)
 
-# Print the summary of each model
-print(model.summaries)
+# Print the within-cluster sum of squares for each model
+print(model.withinss)
 
 # Stop the SparkSession now
 sparkR.session.stop()