[SPARK-6948] [MLLIB] compress vectors in VectorAssembler

The compression is based on storage. brkyvz

Author: Xiangrui Meng <meng@databricks.com>

Closes #5985 from mengxr/SPARK-6948 and squashes the following commits:

df56a00 [Xiangrui Meng] update python tests
6d90d45 [Xiangrui Meng] compress vectors in VectorAssembler
author: Xiangrui Meng <meng@databricks.com> 2015-05-07 15:45:37 -0700
committer: Xiangrui Meng <meng@databricks.com> 2015-05-07 15:45:37 -0700
commit: e43803b8f477b2c8d28836ac163cb54328d13f1a (patch)
tree: 3da358b42d71c182cf1ff262dc0ec509124d3b39 /python
parent: 658a478d3f86456df09d0fbb1ba438fb36d8725c (diff)
download: spark-e43803b8f477b2c8d28836ac163cb54328d13f1a.tar.gz
spark-e43803b8f477b2c8d28836ac163cb54328d13f1a.tar.bz2
spark-e43803b8f477b2c8d28836ac163cb54328d13f1a.zip
1 file changed, 3 insertions, 3 deletions
diff --git a/python/pyspark/ml/feature.py b/python/pyspark/ml/feature.py
index 8a0fdddd2d..705a368192 100644
--- a/python/pyspark/ml/feature.py
+++ b/python/pyspark/ml/feature.py
@@ -121,12 +121,12 @@ class VectorAssembler(JavaTransformer, HasInputCols, HasOutputCol):
     >>> df = sc.parallelize([Row(a=1, b=0, c=3)]).toDF()
     >>> vecAssembler = VectorAssembler(inputCols=["a", "b", "c"], outputCol="features")
     >>> vecAssembler.transform(df).head().features
-    SparseVector(3, {0: 1.0, 2: 3.0})
+    DenseVector([1.0, 0.0, 3.0])
     >>> vecAssembler.setParams(outputCol="freqs").transform(df).head().freqs
-    SparseVector(3, {0: 1.0, 2: 3.0})
+    DenseVector([1.0, 0.0, 3.0])
     >>> params = {vecAssembler.inputCols: ["b", "a"], vecAssembler.outputCol: "vector"}
     >>> vecAssembler.transform(df, params).head().vector
-    SparseVector(2, {1: 1.0})
+    DenseVector([0.0, 1.0])
     """
 
     _java_class = "org.apache.spark.ml.feature.VectorAssembler"
author	Xiangrui Meng <meng@databricks.com>	2015-05-07 15:45:37 -0700
committer	Xiangrui Meng <meng@databricks.com>	2015-05-07 15:45:37 -0700
commit	e43803b8f477b2c8d28836ac163cb54328d13f1a (patch)
tree	3da358b42d71c182cf1ff262dc0ec509124d3b39 /python
parent	658a478d3f86456df09d0fbb1ba438fb36d8725c (diff)
download	spark-e43803b8f477b2c8d28836ac163cb54328d13f1a.tar.gz spark-e43803b8f477b2c8d28836ac163cb54328d13f1a.tar.bz2 spark-e43803b8f477b2c8d28836ac163cb54328d13f1a.zip