aboutsummaryrefslogtreecommitdiff
diff options
context:
space:
mode:
author Reynold Xin <rxin@databricks.com> 2015-08-12 15:27:52 -0700
committer Reynold Xin <rxin@databricks.com> 2015-08-12 15:27:52 -0700
commit a17384fa343628cec44437da5b80b9403ecd5838 (patch)
tree 93983e17a24f54d62c64da86b53c0f6bbafcc6d1
parent 6f60298b1d7aa97268a42eca1e3b4851a7e88cb5 (diff)
download spark-a17384fa343628cec44437da5b80b9403ecd5838.tar.gz
spark-a17384fa343628cec44437da5b80b9403ecd5838.tar.bz2
spark-a17384fa343628cec44437da5b80b9403ecd5838.zip
[SPARK-9907] [SQL] Python crc32 is mistakenly calling md5
Author: Reynold Xin <rxin@databricks.com>
Closes #8138 from rxin/SPARK-9907.
-rw-r--r-- python/pyspark/sql/functions.py 4
1 files changed, 2 insertions, 2 deletions
diff --git a/python/pyspark/sql/functions.py b/python/pyspark/sql/functions.py
index 95f46044d3..e98979533f 100644
--- a/python/pyspark/sql/functions.py
+++ b/python/pyspark/sql/functions.py
@@ -885,10 +885,10 @@ def crc32(col):
returns the value as a bigint.
>>> sqlContext.createDataFrame([('ABC',)], ['a']).select(crc32('a').alias('crc32')).collect()
- [Row(crc32=u'902fbdd2b1df0c4f70b4a5d23525e932')]
+ [Row(crc32=2743272264)]
"""
sc = SparkContext._active_spark_context
- return Column(sc._jvm.functions.md5(_to_java_column(col)))
+ return Column(sc._jvm.functions.crc32(_to_java_column(col)))
@ignore_unicode_prefix