aboutsummaryrefslogtreecommitdiff
path: root/python/pyspark/context.py
diff options
context:
space:
mode:
author Prashant Sharma <prashant.s@imaginea.com> 2014-07-24 18:15:37 -0700
committer Matei Zaharia <matei@databricks.com> 2014-07-24 18:15:37 -0700
commit eff9714e1c88e39e28317358ca9ec87677f121dc (patch)
tree 2f0438b364a3dfa6b20f41a2e697a07a15ea715c /python/pyspark/context.py
parent a45d5480f65d2e969fc7fbd8f358b1717fb99bef (diff)
download spark-eff9714e1c88e39e28317358ca9ec87677f121dc.tar.gz
spark-eff9714e1c88e39e28317358ca9ec87677f121dc.tar.bz2
spark-eff9714e1c88e39e28317358ca9ec87677f121dc.zip
[SPARK-2014] Make PySpark store RDDs in MEMORY_ONLY_SER with compression by default
Author: Prashant Sharma <prashant.s@imaginea.com>
Closes #1051 from ScrapCodes/SPARK-2014/pyspark-cache and squashes the following commits:
f192df7 [Prashant Sharma] Code Review
2a2f43f [Prashant Sharma] [SPARK-2014] Make PySpark store RDDs in MEMORY_ONLY_SER with compression by default
Diffstat (limited to 'python/pyspark/context.py')
-rw-r--r-- python/pyspark/context.py 2
1 files changed, 1 insertions, 1 deletions
diff --git a/python/pyspark/context.py b/python/pyspark/context.py
index e21be0e10a..024fb88187 100644
--- a/python/pyspark/context.py
+++ b/python/pyspark/context.py
@@ -101,7 +101,7 @@ class SparkContext(object):
else:
self.serializer = BatchedSerializer(self._unbatched_serializer,
batchSize)
-
+ self._conf.setIfMissing("spark.rdd.compress", "true")
# Set any parameters passed directly to us on the conf
if master:
self._conf.setMaster(master)