aboutsummaryrefslogtreecommitdiff
path: root/python/pyspark/ml/feature.py
diff options
context:
space:
mode:
Diffstat (limited to 'python/pyspark/ml/feature.py')
-rw-r--r-- python/pyspark/ml/feature.py 15
1 files changed, 8 insertions, 7 deletions
diff --git a/python/pyspark/ml/feature.py b/python/pyspark/ml/feature.py
index 610d167f3a..1b059a7199 100644
--- a/python/pyspark/ml/feature.py
+++ b/python/pyspark/ml/feature.py
@@ -2186,13 +2186,14 @@ class Word2Vec(JavaEstimator, HasStepSize, HasMaxIter, HasSeed, HasInputCol, Has
|   c|[-0.3794820010662...|
+----+--------------------+
...
- >>> model.findSynonyms("a", 2).show()
- +----+-------------------+
- |word|         similarity|
- +----+-------------------+
- |   b| 0.2505344027513247|
- |   c|-0.6980510075367647|
- +----+-------------------+
+ >>> from pyspark.sql.functions import format_number as fmt
+ >>> model.findSynonyms("a", 2).select("word", fmt("similarity", 5).alias("similarity")).show()
+ +----+----------+
+ |word|similarity|
+ +----+----------+
+ |   b|   0.25053|
+ |   c|  -0.69805|
+ +----+----------+
...
>>> model.transform(doc).head().model
DenseVector([0.5524, -0.4995, -0.3599, 0.0241, 0.3461])