[SPARK-6917] [SQL] DecimalType is not read back when non-native type exists

cc yhuai Author: Davies Liu <davies@databricks.com> Closes #6558 from davies/decimalType and squashes the following commits: c877ca8 [Davies Liu] Update ParquetConverter.scala 48cc57c [Davies Liu] Update ParquetConverter.scala b43845c [Davies Liu] add test 3b4a94f [Davies Liu] DecimalType is not read back when non-native type exists
author: Davies Liu <davies@databricks.com> 2015-06-01 23:12:29 -0700
committer: Reynold Xin <rxin@databricks.com> 2015-06-01 23:12:29 -0700
commit: bcb47ad7718b843fbd25cd1e228a7b7e6e5b8686 (patch)
tree: 899a88594e79cd34666e5b5a868081f2f7daebf1 /sql
parent: 0221c7f0efe2512f3ae3839b83aa8abb0806d516 (diff)
download: spark-bcb47ad7718b843fbd25cd1e228a7b7e6e5b8686.tar.gz
spark-bcb47ad7718b843fbd25cd1e228a7b7e6e5b8686.tar.bz2
spark-bcb47ad7718b843fbd25cd1e228a7b7e6e5b8686.zip
2 files changed, 16 insertions, 1 deletions
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/parquet/ParquetConverter.scala b/sql/core/src/main/scala/org/apache/spark/sql/parquet/ParquetConverter.scala
index 1b4196ab0b..caa9f04553 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/parquet/ParquetConverter.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/parquet/ParquetConverter.scala
@@ -243,8 +243,10 @@ private[parquet] abstract class CatalystConverter extends GroupConverter {
   /**
    * Read a decimal value from a Parquet Binary into "dest". Only supports decimals that fit in
    * a long (i.e. precision <= 18)
+   *
+   * Returned value is needed by CatalystConverter, which doesn't reuse the Decimal object.
    */
-  protected[parquet] def readDecimal(dest: Decimal, value: Binary, ctype: DecimalType): Unit = {
+  protected[parquet] def readDecimal(dest: Decimal, value: Binary, ctype: DecimalType): Decimal = {
     val precision = ctype.precisionInfo.get.precision
     val scale = ctype.precisionInfo.get.scale
     val bytes = value.getBytes
diff --git a/sql/core/src/test/scala/org/apache/spark/sql/parquet/ParquetQuerySuite.scala b/sql/core/src/test/scala/org/apache/spark/sql/parquet/ParquetQuerySuite.scala
index b98ba09ccf..304936fb2b 100644
--- a/sql/core/src/test/scala/org/apache/spark/sql/parquet/ParquetQuerySuite.scala
+++ b/sql/core/src/test/scala/org/apache/spark/sql/parquet/ParquetQuerySuite.scala
@@ -19,6 +19,7 @@ package org.apache.spark.sql.parquet
 
 import org.scalatest.BeforeAndAfterAll
 
+import org.apache.spark.sql.types._
 import org.apache.spark.sql.{SQLConf, QueryTest}
 import org.apache.spark.sql.catalyst.expressions.Row
 import org.apache.spark.sql.test.TestSQLContext
@@ -111,6 +112,18 @@ class ParquetQuerySuiteBase extends QueryTest with ParquetTest {
         List(Row("same", "run_5", 100)))
     }
   }
+
+  test("SPARK-6917 DecimalType should work with non-native types") {
+    val data = (1 to 10).map(i => Row(Decimal(i, 18, 0), new java.sql.Timestamp(i)))
+    val schema = StructType(List(StructField("d", DecimalType(18, 0), false),
+      StructField("time", TimestampType, false)).toArray)
+    withTempPath { file =>
+      val df = sqlContext.createDataFrame(sparkContext.parallelize(data), schema)
+      df.write.parquet(file.getCanonicalPath)
+      val df2 = sqlContext.read.parquet(file.getCanonicalPath)
+      checkAnswer(df2, df.collect().toSeq)
+    }
+  }
 }
 
 class ParquetDataSourceOnQuerySuite extends ParquetQuerySuiteBase with BeforeAndAfterAll {
author	Davies Liu <davies@databricks.com>	2015-06-01 23:12:29 -0700
committer	Reynold Xin <rxin@databricks.com>	2015-06-01 23:12:29 -0700
commit	bcb47ad7718b843fbd25cd1e228a7b7e6e5b8686 (patch)
tree	899a88594e79cd34666e5b5a868081f2f7daebf1 /sql
parent	0221c7f0efe2512f3ae3839b83aa8abb0806d516 (diff)
download	spark-bcb47ad7718b843fbd25cd1e228a7b7e6e5b8686.tar.gz spark-bcb47ad7718b843fbd25cd1e228a7b7e6e5b8686.tar.bz2 spark-bcb47ad7718b843fbd25cd1e228a7b7e6e5b8686.zip