aboutsummaryrefslogtreecommitdiff
path: root/mllib/src/test
diff options
context:
space:
mode:
authorXiangrui Meng <meng@databricks.com>2015-05-20 23:38:58 -0700
committerXiangrui Meng <meng@databricks.com>2015-05-20 23:39:06 -0700
commit64762444e712189701663da272cab6c657368883 (patch)
tree23e43192749a3330789b7483597e6b34976ea399 /mllib/src/test
parentb0e7c6633811f08c2454a8563ae13809a667ca60 (diff)
downloadspark-64762444e712189701663da272cab6c657368883.tar.gz
spark-64762444e712189701663da272cab6c657368883.tar.bz2
spark-64762444e712189701663da272cab6c657368883.zip
[SPARK-7753] [MLLIB] Update KernelDensity API
Update `KernelDensity` API to make it extensible to different kernels in the future. `bandwidth` is used instead of `standardDeviation`. The static `kernelDensity` method is removed from `Statistics`. The implementation is updated using BLAS, while the algorithm remains the same. sryza srowen Author: Xiangrui Meng <meng@databricks.com> Closes #6279 from mengxr/SPARK-7753 and squashes the following commits: 4cdfadc [Xiangrui Meng] add example code in the doc 767fd5a [Xiangrui Meng] update KernelDensity API (cherry picked from commit 947ea1cf5f6986aa687631d6cf9f0fb974ee7caf) Signed-off-by: Xiangrui Meng <meng@databricks.com>
Diffstat (limited to 'mllib/src/test')
-rw-r--r--mllib/src/test/scala/org/apache/spark/mllib/stat/KernelDensitySuite.scala7
1 files changed, 3 insertions, 4 deletions
diff --git a/mllib/src/test/scala/org/apache/spark/mllib/stat/KernelDensitySuite.scala b/mllib/src/test/scala/org/apache/spark/mllib/stat/KernelDensitySuite.scala
index 16ecae23dd..14bb1cebf0 100644
--- a/mllib/src/test/scala/org/apache/spark/mllib/stat/KernelDensitySuite.scala
+++ b/mllib/src/test/scala/org/apache/spark/mllib/stat/KernelDensitySuite.scala
@@ -17,9 +17,8 @@
package org.apache.spark.mllib.stat
-import org.scalatest.FunSuite
-
import org.apache.commons.math3.distribution.NormalDistribution
+import org.scalatest.FunSuite
import org.apache.spark.mllib.util.MLlibTestSparkContext
@@ -27,7 +26,7 @@ class KernelDensitySuite extends FunSuite with MLlibTestSparkContext {
test("kernel density single sample") {
val rdd = sc.parallelize(Array(5.0))
val evaluationPoints = Array(5.0, 6.0)
- val densities = KernelDensity.estimate(rdd, 3.0, evaluationPoints)
+ val densities = new KernelDensity().setSample(rdd).setBandwidth(3.0).estimate(evaluationPoints)
val normal = new NormalDistribution(5.0, 3.0)
val acceptableErr = 1e-6
assert(densities(0) - normal.density(5.0) < acceptableErr)
@@ -37,7 +36,7 @@ class KernelDensitySuite extends FunSuite with MLlibTestSparkContext {
test("kernel density multiple samples") {
val rdd = sc.parallelize(Array(5.0, 10.0))
val evaluationPoints = Array(5.0, 6.0)
- val densities = KernelDensity.estimate(rdd, 3.0, evaluationPoints)
+ val densities = new KernelDensity().setSample(rdd).setBandwidth(3.0).estimate(evaluationPoints)
val normal1 = new NormalDistribution(5.0, 3.0)
val normal2 = new NormalDistribution(10.0, 3.0)
val acceptableErr = 1e-6