about summary refs log tree commit diff
path: root/examples/src/main/r/ml/ml.R
diff options
context:
space:
mode:
Diffstat (limited to 'examples/src/main/r/ml/ml.R')
-rw-r--r-- examples/src/main/r/ml/ml.R 9
1 files changed, 5 insertions, 4 deletions
diff --git a/examples/src/main/r/ml/ml.R b/examples/src/main/r/ml/ml.R
index b96819418b..41b7867f64 100644
--- a/examples/src/main/r/ml/ml.R
+++ b/examples/src/main/r/ml/ml.R
@@ -26,11 +26,12 @@ sparkR.session(appName = "SparkR-ML-example")
############################ model read/write ##############################################
# $example on:read_write$
-irisDF <- suppressWarnings(createDataFrame(iris))
+training <- read.df("data/mllib/sample_multiclass_classification_data.txt", source = "libsvm")
# Fit a generalized linear model of family "gaussian" with spark.glm
-gaussianDF <- irisDF
-gaussianTestDF <- irisDF
-gaussianGLM <- spark.glm(gaussianDF, Sepal_Length ~ Sepal_Width + Species, family = "gaussian")
+df_list <- randomSplit(training, c(7,3), 2)
+gaussianDF <- df_list[[1]]
+gaussianTestDF <- df_list[[2]]
+gaussianGLM <- spark.glm(gaussianDF, label ~ features, family = "gaussian")
# Save and then load a fitted MLlib model
modelPath <- tempfile(pattern = "ml", fileext = ".tmp")