aboutsummaryrefslogtreecommitdiff
path: root/pyspark
diff options
context:
space:
mode:
authorJosh Rosen <joshrosen@eecs.berkeley.edu>2012-12-29 16:01:03 -0800
committerJosh Rosen <joshrosen@eecs.berkeley.edu>2012-12-29 16:01:03 -0800
commit59195c68ec37acf20d527189ed757397b273a207 (patch)
tree33d583fe91325fbc2bb94b27ba4ef3503e7fdda3 /pyspark
parentc5cee53f2092ee2825095a1831ca47f1c41afc2f (diff)
downloadspark-59195c68ec37acf20d527189ed757397b273a207.tar.gz
spark-59195c68ec37acf20d527189ed757397b273a207.tar.bz2
spark-59195c68ec37acf20d527189ed757397b273a207.zip
Update PySpark for compatibility with TaskContext.
Diffstat (limited to 'pyspark')
-rw-r--r--pyspark/pyspark/rdd.py3
1 files changed, 2 insertions, 1 deletions
diff --git a/pyspark/pyspark/rdd.py b/pyspark/pyspark/rdd.py
index 203f7377d2..21dda31c4e 100644
--- a/pyspark/pyspark/rdd.py
+++ b/pyspark/pyspark/rdd.py
@@ -335,9 +335,10 @@ class RDD(object):
"""
items = []
splits = self._jrdd.splits()
+ taskContext = self.ctx.jvm.spark.TaskContext(0, 0, 0)
while len(items) < num and splits:
split = splits.pop(0)
- iterator = self._jrdd.iterator(split)
+ iterator = self._jrdd.iterator(split, taskContext)
items.extend(self._collect_iterator_through_file(iterator))
return items[:num]