[SPARK-11555] spark on yarn spark-class --num-workers doesn't work

I tested the various options with both spark-submit and spark-class of specifying number of executors in both client and cluster mode where it applied. --num-workers, --num-executors, spark.executor.instances, SPARK_EXECUTOR_INSTANCES, default nothing supplied Author: Thomas Graves <tgraves@staydecay.corp.gq1.yahoo.com> Closes #9523 from tgravescs/SPARK-11555.
author: Thomas Graves <tgraves@staydecay.corp.gq1.yahoo.com> 2015-11-06 15:24:33 -0800
committer: Marcelo Vanzin <vanzin@cloudera.com> 2015-11-06 15:24:33 -0800
commit: f6680cdc5d2912dea9768ef5c3e2cc101b06daf8 (patch)
tree: 0087cc43a0bbae9f3387288dc0f21adb5a2d61a2 /yarn/src/main
parent: c447c9d54603890db7399fb80adc9fae40b71f64 (diff)
download: spark-f6680cdc5d2912dea9768ef5c3e2cc101b06daf8.tar.gz
spark-f6680cdc5d2912dea9768ef5c3e2cc101b06daf8.tar.bz2
spark-f6680cdc5d2912dea9768ef5c3e2cc101b06daf8.zip
2 files changed, 6 insertions, 3 deletions
diff --git a/yarn/src/main/scala/org/apache/spark/deploy/yarn/ClientArguments.scala b/yarn/src/main/scala/org/apache/spark/deploy/yarn/ClientArguments.scala
index 1165061db2..a9f4374357 100644
--- a/yarn/src/main/scala/org/apache/spark/deploy/yarn/ClientArguments.scala
+++ b/yarn/src/main/scala/org/apache/spark/deploy/yarn/ClientArguments.scala
@@ -81,7 +81,7 @@ private[spark] class ClientArguments(args: Array[String], sparkConf: SparkConf)
       .orNull
     // If dynamic allocation is enabled, start at the configured initial number of executors.
     // Default to minExecutors if no initialExecutors is set.
-    numExecutors = YarnSparkHadoopUtil.getInitialTargetExecutorNumber(sparkConf)
+    numExecutors = YarnSparkHadoopUtil.getInitialTargetExecutorNumber(sparkConf, numExecutors)
     principal = Option(principal)
       .orElse(sparkConf.getOption("spark.yarn.principal"))
       .orNull
diff --git a/yarn/src/main/scala/org/apache/spark/deploy/yarn/YarnSparkHadoopUtil.scala b/yarn/src/main/scala/org/apache/spark/deploy/yarn/YarnSparkHadoopUtil.scala
index 561ad79ee0..a290ebeec9 100644
--- a/yarn/src/main/scala/org/apache/spark/deploy/yarn/YarnSparkHadoopUtil.scala
+++ b/yarn/src/main/scala/org/apache/spark/deploy/yarn/YarnSparkHadoopUtil.scala
@@ -392,8 +392,11 @@ object YarnSparkHadoopUtil {
   /**
    * Getting the initial target number of executors depends on whether dynamic allocation is
    * enabled.
+   * If not using dynamic allocation it gets the number of executors reqeusted by the user.
    */
-  def getInitialTargetExecutorNumber(conf: SparkConf): Int = {
+  def getInitialTargetExecutorNumber(
+      conf: SparkConf,
+      numExecutors: Int = DEFAULT_NUMBER_EXECUTORS): Int = {
     if (Utils.isDynamicAllocationEnabled(conf)) {
       val minNumExecutors = conf.getInt("spark.dynamicAllocation.minExecutors", 0)
       val initialNumExecutors =
@@ -406,7 +409,7 @@ object YarnSparkHadoopUtil {
       initialNumExecutors
     } else {
       val targetNumExecutors =
-        sys.env.get("SPARK_EXECUTOR_INSTANCES").map(_.toInt).getOrElse(DEFAULT_NUMBER_EXECUTORS)
+        sys.env.get("SPARK_EXECUTOR_INSTANCES").map(_.toInt).getOrElse(numExecutors)
       // System property can override environment variable.
       conf.getInt("spark.executor.instances", targetNumExecutors)
     }
author	Thomas Graves <tgraves@staydecay.corp.gq1.yahoo.com>	2015-11-06 15:24:33 -0800
committer	Marcelo Vanzin <vanzin@cloudera.com>	2015-11-06 15:24:33 -0800
commit	f6680cdc5d2912dea9768ef5c3e2cc101b06daf8 (patch)
tree	0087cc43a0bbae9f3387288dc0f21adb5a2d61a2 /yarn/src/main
parent	c447c9d54603890db7399fb80adc9fae40b71f64 (diff)
download	spark-f6680cdc5d2912dea9768ef5c3e2cc101b06daf8.tar.gz spark-f6680cdc5d2912dea9768ef5c3e2cc101b06daf8.tar.bz2 spark-f6680cdc5d2912dea9768ef5c3e2cc101b06daf8.zip