aboutsummaryrefslogtreecommitdiff
path: root/core
diff options
context:
space:
mode:
authorBouke van der Bijl <boukevanderbijl@gmail.com>2014-05-10 13:02:13 -0700
committerPatrick Wendell <pwendell@gmail.com>2014-05-10 13:02:13 -0700
commit3776f2f283842543ff766398292532c6e94221cc (patch)
treec42e92390922359f8b3fec88ad5b371014900e40 /core
parentc05d11bb307eaba40c5669da2d374c28debaa55a (diff)
downloadspark-3776f2f283842543ff766398292532c6e94221cc.tar.gz
spark-3776f2f283842543ff766398292532c6e94221cc.tar.bz2
spark-3776f2f283842543ff766398292532c6e94221cc.zip
Add Python includes to path before depickling broadcast values
This fixes https://issues.apache.org/jira/browse/SPARK-1731 by adding the Python includes to the PYTHONPATH before depickling the broadcast values @airhorns Author: Bouke van der Bijl <boukevanderbijl@gmail.com> Closes #656 from bouk/python-includes-before-broadcast and squashes the following commits: 7b0dfe4 [Bouke van der Bijl] Add Python includes to path before depickling broadcast values
Diffstat (limited to 'core')
-rw-r--r--core/src/main/scala/org/apache/spark/api/python/PythonRDD.scala10
1 files changed, 5 insertions, 5 deletions
diff --git a/core/src/main/scala/org/apache/spark/api/python/PythonRDD.scala b/core/src/main/scala/org/apache/spark/api/python/PythonRDD.scala
index fecd9762f3..388b838d78 100644
--- a/core/src/main/scala/org/apache/spark/api/python/PythonRDD.scala
+++ b/core/src/main/scala/org/apache/spark/api/python/PythonRDD.scala
@@ -179,6 +179,11 @@ private[spark] class PythonRDD[T: ClassTag](
dataOut.writeInt(split.index)
// sparkFilesDir
PythonRDD.writeUTF(SparkFiles.getRootDirectory, dataOut)
+ // Python includes (*.zip and *.egg files)
+ dataOut.writeInt(pythonIncludes.length)
+ for (include <- pythonIncludes) {
+ PythonRDD.writeUTF(include, dataOut)
+ }
// Broadcast variables
dataOut.writeInt(broadcastVars.length)
for (broadcast <- broadcastVars) {
@@ -186,11 +191,6 @@ private[spark] class PythonRDD[T: ClassTag](
dataOut.writeInt(broadcast.value.length)
dataOut.write(broadcast.value)
}
- // Python includes (*.zip and *.egg files)
- dataOut.writeInt(pythonIncludes.length)
- for (include <- pythonIncludes) {
- PythonRDD.writeUTF(include, dataOut)
- }
dataOut.flush()
// Serialized command:
dataOut.writeInt(command.length)