aboutsummaryrefslogtreecommitdiff
diff options
context:
space:
mode:
author: Junyang Qian <junyangq@databricks.com> 2016-08-29 10:23:10 -0700
committer: Xiangrui Meng <meng@databricks.com> 2016-08-29 10:23:10 -0700
commit: 6a0fda2c0590b455e8713da79cd5f2413e5d0f28 (patch)
tree: fc2a2f70686614f574b7567a0f4428b5031843b4
parent: 08913ce0002a80a989489a31b7353f5ec4a5849f (diff)
download: spark-6a0fda2c0590b455e8713da79cd5f2413e5d0f28.tar.gz
spark-6a0fda2c0590b455e8713da79cd5f2413e5d0f28.tar.bz2
spark-6a0fda2c0590b455e8713da79cd5f2413e5d0f28.zip
[SPARKR][MINOR] Fix LDA doc
## What changes were proposed in this pull request?

This PR tries to fix the name of the `SparkDataFrame` used in the example. It also gives a reference URL of an example data file so that users can play with it.

## How was this patch tested?

Manual test.

Author: Junyang Qian <junyangq@databricks.com>

Closes #14853 from junyangq/SPARKR-FixLDADoc.
-rw-r--r-- R/pkg/R/mllib.R 10
1 files changed, 7 insertions, 3 deletions
diff --git a/R/pkg/R/mllib.R b/R/pkg/R/mllib.R
index 6808aaea8c..64d19fab7e 100644
--- a/R/pkg/R/mllib.R
+++ b/R/pkg/R/mllib.R
@@ -994,18 +994,22 @@ setMethod("spark.survreg", signature(data = "SparkDataFrame", formula = "formula
#' @export
#' @examples
#' \dontrun{
-#' text <- read.df("path/to/data", source = "libsvm")
+#' # nolint start
+#' # An example "path/to/file" can be
+#' # paste0(Sys.getenv("SPARK_HOME"), "/data/mllib/sample_lda_libsvm_data.txt")
+#' # nolint end
+#' text <- read.df("path/to/file", source = "libsvm")
#' model <- spark.lda(data = text, optimizer = "em")
#'
#' # get a summary of the model
#' summary(model)
#'
#' # compute posterior probabilities
-#' posterior <- spark.posterior(model, df)
+#' posterior <- spark.posterior(model, text)
#' showDF(posterior)
#'
#' # compute perplexity
-#' perplexity <- spark.perplexity(model, df)
+#' perplexity <- spark.perplexity(model, text)
#'
#' # save and load the model
#' path <- "path/to/model"