about | summary | refs | log | tree | commit | diff
path: root/python/pyspark/sql.py
diff options
context:
space:
mode:
Diffstat (limited to 'python/pyspark/sql.py')
-rw-r--r-- python/pyspark/sql.py | 5
1 file changed, 4 insertions, 1 deletion
diff --git a/python/pyspark/sql.py b/python/pyspark/sql.py
index f2001afae4..fa4b9c7b68 100644
--- a/python/pyspark/sql.py
+++ b/python/pyspark/sql.py
@@ -323,7 +323,10 @@ class SchemaRDD(RDD):
def count(self):
"""
- Return the number of elements in this RDD.
+ Return the number of elements in this RDD. Unlike the base RDD
+ implementation of count, this implementation leverages the query
+ optimizer to compute the count on the SchemaRDD, which supports
+ features such as filter pushdown.
>>> srdd = sqlCtx.inferSchema(rdd)
>>> srdd.count()