aboutsummaryrefslogtreecommitdiff
path: root/python/pyspark/rdd.py
diff options
context:
space:
mode:
author: Davies Liu <davies@databricks.com> 2015-02-24 14:50:00 -0800
committer: Joseph K. Bradley <joseph@databricks.com> 2015-02-24 14:50:00 -0800
commit: da505e59274d1c838653c1109db65ad374e65304 (patch)
tree: 4217693d3d266655bd800f8ca678aa5e39e68a93 /python/pyspark/rdd.py
parent: a2b9137923e0ba328da8fff2fbbfcf2abf50b033 (diff)
download: spark-da505e59274d1c838653c1109db65ad374e65304.tar.gz
spark-da505e59274d1c838653c1109db65ad374e65304.tar.bz2
spark-da505e59274d1c838653c1109db65ad374e65304.zip
[SPARK-5973] [PySpark] fix zip with two RDDs with AutoBatchedSerializer
Author: Davies Liu <davies@databricks.com>

Closes #4745 from davies/fix_zip and squashes the following commits:

2124b2c [Davies Liu] Update tests.py
b5c828f [Davies Liu] increase the number of records
c1e40fd [Davies Liu] fix zip with two RDDs with AutoBatchedSerializer
Diffstat (limited to 'python/pyspark/rdd.py')
-rw-r--r-- python/pyspark/rdd.py 2
1 file changed, 1 insertion, 1 deletion
diff --git a/python/pyspark/rdd.py b/python/pyspark/rdd.py
index ba2347ae76..d3148de6f4 100644
--- a/python/pyspark/rdd.py
+++ b/python/pyspark/rdd.py
@@ -1950,7 +1950,7 @@ class RDD(object):
my_batch = get_batch_size(self._jrdd_deserializer)
other_batch = get_batch_size(other._jrdd_deserializer)
- if my_batch != other_batch:
+ if my_batch != other_batch or not my_batch:
# use the smallest batchSize for both of them
batchSize = min(my_batch, other_batch)
if batchSize <= 0: