[SPARK-17702][SQL] Code generation including too many mutable states exceeds JVM size limit.

## What changes were proposed in this pull request? Code generation including too many mutable states exceeds JVM size limit to extract values from `references` into fields in the constructor. We should split the generated extractions in the constructor into smaller functions. ## How was this patch tested? I added some tests to check if the generated codes for the expressions exceed or not. Author: Takuya UESHIN <ueshin@happy-camper.st> Closes #15275 from ueshin/issues/SPARK-17702.
author: Takuya UESHIN <ueshin@happy-camper.st> 2016-10-03 21:48:58 -0700
committer: Reynold Xin <rxin@databricks.com> 2016-10-03 21:48:58 -0700
commit: b1b47274bfeba17a9e4e9acebd7385289f31f6c8 (patch)
tree: efdc4ab1c4ff848253d55188a16d427e9a0e44b4 /sql/catalyst/src/test
parent: c571cfb2d0e1e224107fc3f0c672730cae9804cb (diff)
download: spark-b1b47274bfeba17a9e4e9acebd7385289f31f6c8.tar.gz
spark-b1b47274bfeba17a9e4e9acebd7385289f31f6c8.tar.bz2
spark-b1b47274bfeba17a9e4e9acebd7385289f31f6c8.zip
1 files changed, 20 insertions, 1 deletions
diff --git a/sql/catalyst/src/test/scala/org/apache/spark/sql/catalyst/expressions/CodeGenerationSuite.scala b/sql/catalyst/src/test/scala/org/apache/spark/sql/catalyst/expressions/CodeGenerationSuite.scala
index 45dcfcaf23..5588b44291 100644
--- a/sql/catalyst/src/test/scala/org/apache/spark/sql/catalyst/expressions/CodeGenerationSuite.scala
+++ b/sql/catalyst/src/test/scala/org/apache/spark/sql/catalyst/expressions/CodeGenerationSuite.scala
@@ -17,6 +17,8 @@
 
 package org.apache.spark.sql.catalyst.expressions
 
+import java.sql.Timestamp
+
 import org.apache.spark.SparkFunSuite
 import org.apache.spark.metrics.source.CodegenMetrics
 import org.apache.spark.sql.Row
@@ -24,7 +26,7 @@ import org.apache.spark.sql.catalyst.InternalRow
 import org.apache.spark.sql.catalyst.dsl.expressions._
 import org.apache.spark.sql.catalyst.expressions.codegen._
 import org.apache.spark.sql.catalyst.expressions.objects.{CreateExternalRow, GetExternalRowField, ValidateExternalType}
-import org.apache.spark.sql.catalyst.util.{ArrayBasedMapData, GenericArrayData}
+import org.apache.spark.sql.catalyst.util.{ArrayBasedMapData, DateTimeUtils, GenericArrayData}
 import org.apache.spark.sql.types._
 import org.apache.spark.unsafe.types.UTF8String
 import org.apache.spark.util.ThreadUtils
@@ -164,6 +166,23 @@ class CodeGenerationSuite extends SparkFunSuite with ExpressionEvalHelper {
     }
   }
 
+  test("SPARK-17702: split wide constructor into blocks due to JVM code size limit") {
+    val length = 5000
+    val expressions = Seq.fill(length) {
+      ToUTCTimestamp(
+        Literal.create(Timestamp.valueOf("2015-07-24 00:00:00"), TimestampType),
+        Literal.create("PST", StringType))
+    }
+    val plan = GenerateMutableProjection.generate(expressions)
+    val actual = plan(new GenericMutableRow(length)).toSeq(expressions.map(_.dataType))
+    val expected = Seq.fill(length)(
+      DateTimeUtils.fromJavaTimestamp(Timestamp.valueOf("2015-07-24 07:00:00")))
+
+    if (!checkResult(actual, expected)) {
+      fail(s"Incorrect Evaluation: expressions: $expressions, actual: $actual, expected: $expected")
+    }
+  }
+
   test("test generated safe and unsafe projection") {
     val schema = new StructType(Array(
       StructField("a", StringType, true),
author	Takuya UESHIN <ueshin@happy-camper.st>	2016-10-03 21:48:58 -0700
committer	Reynold Xin <rxin@databricks.com>	2016-10-03 21:48:58 -0700
commit	b1b47274bfeba17a9e4e9acebd7385289f31f6c8 (patch)
tree	efdc4ab1c4ff848253d55188a16d427e9a0e44b4 /sql/catalyst/src/test
parent	c571cfb2d0e1e224107fc3f0c672730cae9804cb (diff)
download	spark-b1b47274bfeba17a9e4e9acebd7385289f31f6c8.tar.gz spark-b1b47274bfeba17a9e4e9acebd7385289f31f6c8.tar.bz2 spark-b1b47274bfeba17a9e4e9acebd7385289f31f6c8.zip