about | summary | refs | log | tree | commit | diff
path: root/python
diff options
context:
space:
mode:
author Josh Rosen <joshrosen@apache.org> 2014-01-23 13:05:59 -0800
committer Josh Rosen <joshrosen@apache.org> 2014-01-23 13:05:59 -0800
commit 0035dbbc8125af94ae27cb6f10e87aa6f5a078b1 (patch)
tree c0c87e7f66a1c09b6ac62d16ae862ae798b65c0c /python
parent a2b47dae66a437f02bc053e9bde5c1472cff0fc6 (diff)
download spark-0035dbbc8125af94ae27cb6f10e87aa6f5a078b1.tar.gz
spark-0035dbbc8125af94ae27cb6f10e87aa6f5a078b1.tar.bz2
spark-0035dbbc8125af94ae27cb6f10e87aa6f5a078b1.zip
Fix SPARK-1034: Py4JException on PySpark Cartesian Result
Diffstat (limited to 'python')
-rw-r--r-- python/pyspark/tests.py 7
1 files changed, 7 insertions, 0 deletions
diff --git a/python/pyspark/tests.py b/python/pyspark/tests.py
index 7acb6eaf10..05a9f7f0d1 100644
--- a/python/pyspark/tests.py
+++ b/python/pyspark/tests.py
@@ -152,6 +152,13 @@ class TestRDDFunctions(PySparkTestCase):
raw_contents = ''.join(input(glob(tempFile.name + "/part-0000*")))
self.assertEqual(x, unicode(raw_contents.strip(), "utf-8"))
+ def test_transforming_cartesian_result(self):
+ # Regression test for SPARK-1034
+ rdd1 = self.sc.parallelize([1, 2])
+ rdd2 = self.sc.parallelize([3, 4])
+ cart = rdd1.cartesian(rdd2)
+ result = cart.map(lambda (x, y): x + y).collect()
+
class TestIO(PySparkTestCase):