aboutsummaryrefslogtreecommitdiff
path: root/python/pyspark/sql/dataframe.py
diff options
context:
space:
mode:
author amey <amey@skytree.net> 2015-06-05 13:49:33 -0700
committer Reynold Xin <rxin@databricks.com> 2015-06-05 13:49:33 -0700
commit 356a4a9b93a1eeedb910c6bccc0abadf59e4877f (patch)
tree dc940317bdc5cccadf5cefbfa0d1625c80f7517e /python/pyspark/sql/dataframe.py
parent 4060526cd3b7e9ba345ce94f6e081cc1156e53ab (diff)
download spark-356a4a9b93a1eeedb910c6bccc0abadf59e4877f.tar.gz
spark-356a4a9b93a1eeedb910c6bccc0abadf59e4877f.tar.bz2
spark-356a4a9b93a1eeedb910c6bccc0abadf59e4877f.zip
[SPARK-7991] [PySpark] Adding support for passing lists to describe.
This is a minor change.

Author: amey <amey@skytree.net>

Closes #6655 from ameyc/JIRA-7991/support-passing-list-to-describe and squashes the following commits:

e8a1dff [amey] Adding support for passing lists to describe.
Diffstat (limited to 'python/pyspark/sql/dataframe.py')
-rw-r--r-- python/pyspark/sql/dataframe.py 12
1 files changed, 12 insertions, 0 deletions
diff --git a/python/pyspark/sql/dataframe.py b/python/pyspark/sql/dataframe.py
index 03b01a1136..902504df5b 100644
--- a/python/pyspark/sql/dataframe.py
+++ b/python/pyspark/sql/dataframe.py
@@ -616,7 +616,19 @@ class DataFrame(object):
|    min|  2|
|    max|  5|
+-------+---+
+ >>> df.describe(['age', 'name']).show()
+ +-------+---+-----+
+ |summary|age| name|
+ +-------+---+-----+
+ | count| 2| 2|
+ | mean|3.5| null|
+ | stddev|1.5| null|
+ | min| 2|Alice|
+ | max| 5| Bob|
+ +-------+---+-----+
"""
+ if len(cols) == 1 and isinstance(cols[0], list):
+ cols = cols[0]
jdf = self._jdf.describe(self._jseq(cols))
return DataFrame(jdf, self.sql_ctx)