aboutsummaryrefslogtreecommitdiff
path: root/python/pyspark
diff options
context:
space:
mode:
authorHolden Karau <holden@us.ibm.com>2016-09-23 09:44:30 +0100
committerSean Owen <sowen@cloudera.com>2016-09-23 09:44:30 +0100
commit90d5754212425d55f992c939a2bc7d9ac6ef92b8 (patch)
tree59d36048cc576bce47d1003e35186204532bf894 /python/pyspark
parent5c5396cb4725ba5ceee26ed885e8b941d219757b (diff)
downloadspark-90d5754212425d55f992c939a2bc7d9ac6ef92b8.tar.gz
spark-90d5754212425d55f992c939a2bc7d9ac6ef92b8.tar.bz2
spark-90d5754212425d55f992c939a2bc7d9ac6ef92b8.zip
[SPARK-16861][PYSPARK][CORE] Refactor PySpark accumulator API on top of Accumulator V2
## What changes were proposed in this pull request? Move the internals of the PySpark accumulator API from the old deprecated API on top of the new accumulator API. ## How was this patch tested? The existing PySpark accumulator tests (both unit tests and doc tests at the start of accumulator.py). Author: Holden Karau <holden@us.ibm.com> Closes #14467 from holdenk/SPARK-16861-refactor-pyspark-accumulator-api.
Diffstat (limited to 'python/pyspark')
-rw-r--r--python/pyspark/context.py5
1 files changed, 2 insertions, 3 deletions
diff --git a/python/pyspark/context.py b/python/pyspark/context.py
index 7a7f59cb50..a3dd1950a5 100644
--- a/python/pyspark/context.py
+++ b/python/pyspark/context.py
@@ -173,9 +173,8 @@ class SparkContext(object):
# they will be passed back to us through a TCP server
self._accumulatorServer = accumulators._start_update_server()
(host, port) = self._accumulatorServer.server_address
- self._javaAccumulator = self._jsc.accumulator(
- self._jvm.java.util.ArrayList(),
- self._jvm.PythonAccumulatorParam(host, port))
+ self._javaAccumulator = self._jvm.PythonAccumulatorV2(host, port)
+ self._jsc.sc().register(self._javaAccumulator)
self.pythonExec = os.environ.get("PYSPARK_PYTHON", 'python')
self.pythonVer = "%d.%d" % sys.version_info[:2]