aboutsummaryrefslogtreecommitdiff
diff options
context:
space:
mode:
author Reynold Xin <rxin@databricks.com> 2015-08-12 15:27:52 -0700
committer Reynold Xin <rxin@databricks.com> 2015-08-12 15:27:58 -0700
commit b28295fe0c91405ade86e215083de25ec5bb52d9 (patch)
tree 4145cab355c33fd02c37078a522d95ea0078017d
parent 6a7582ea2d232982c3480e7d4ee357ea45d0b303 (diff)
download spark-b28295fe0c91405ade86e215083de25ec5bb52d9.tar.gz
spark-b28295fe0c91405ade86e215083de25ec5bb52d9.tar.bz2
spark-b28295fe0c91405ade86e215083de25ec5bb52d9.zip
[SPARK-9907] [SQL] Python crc32 is mistakenly calling md5
Author: Reynold Xin <rxin@databricks.com>
Closes #8138 from rxin/SPARK-9907.
(cherry picked from commit a17384fa343628cec44437da5b80b9403ecd5838)
Signed-off-by: Reynold Xin <rxin@databricks.com>
-rw-r--r-- python/pyspark/sql/functions.py | 4
1 file changed, 2 insertions, 2 deletions
diff --git a/python/pyspark/sql/functions.py b/python/pyspark/sql/functions.py
index 95f46044d3..e98979533f 100644
--- a/python/pyspark/sql/functions.py
+++ b/python/pyspark/sql/functions.py
@@ -885,10 +885,10 @@ def crc32(col):
returns the value as a bigint.
>>> sqlContext.createDataFrame([('ABC',)], ['a']).select(crc32('a').alias('crc32')).collect()
- [Row(crc32=u'902fbdd2b1df0c4f70b4a5d23525e932')]
+ [Row(crc32=2743272264)]
"""
sc = SparkContext._active_spark_context
- return Column(sc._jvm.functions.md5(_to_java_column(col)))
+ return Column(sc._jvm.functions.crc32(_to_java_column(col)))
@ignore_unicode_prefix