diff options
author:    Wenchen Fan <wenchen@databricks.com>  2016-01-29 23:37:51 -0800
committer: Davies Liu <davies.liu@gmail.com>     2016-01-29 23:37:51 -0800
commit:    dab246f7e4664d36073ec49d9df8a11c5e998cdb (patch)
tree:      f909d719d3cadfc4fbcc486f15cfc4b6d07e51fa /sql
parent:    e6a02c66d53f59ba2d5c1548494ae80a385f9f5c (diff)
download:  spark-dab246f7e4664d36073ec49d9df8a11c5e998cdb.tar.gz
           spark-dab246f7e4664d36073ec49d9df8a11c5e998cdb.tar.bz2
           spark-dab246f7e4664d36073ec49d9df8a11c5e998cdb.zip
[SPARK-13098] [SQL] remove GenericInternalRowWithSchema
This class is only used for serialization of Python DataFrame. However, we don't require internal row there, so `GenericRowWithSchema` can also do the job.
Author: Wenchen Fan <wenchen@databricks.com>
Closes #10992 from cloud-fan/python.
Diffstat (limited to 'sql')
-rw-r--r--   sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/rows.scala | 12
-rw-r--r--   sql/core/src/main/scala/org/apache/spark/sql/execution/python.scala              | 13
2 files changed, 5 insertions, 20 deletions
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/rows.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/rows.scala
index 387d979484..be6b2530ef 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/rows.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/rows.scala
@@ -233,18 +233,6 @@ class GenericInternalRow(private[sql] val values: Array[Any]) extends BaseGenericInternalRow {
   override def copy(): GenericInternalRow = this
 }
 
-/**
- * This is used for serialization of Python DataFrame
- */
-class GenericInternalRowWithSchema(values: Array[Any], val schema: StructType)
-  extends GenericInternalRow(values) {
-
-  /** No-arg constructor for serialization. */
-  protected def this() = this(null, null)
-
-  def fieldIndex(name: String): Int = schema.fieldIndex(name)
-}
-
 class GenericMutableRow(values: Array[Any]) extends MutableRow with BaseGenericInternalRow {
   /** No-arg constructor for serialization. */
   protected def this() = this(null)
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/python.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/python.scala
index e3a016e18d..bf62bb05c3 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/python.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/python.scala
@@ -143,7 +143,7 @@ object EvaluatePython {
         values(i) = toJava(row.get(i, struct.fields(i).dataType), struct.fields(i).dataType)
         i += 1
       }
-      new GenericInternalRowWithSchema(values, struct)
+      new GenericRowWithSchema(values, struct)
 
     case (a: ArrayData, array: ArrayType) =>
       val values = new java.util.ArrayList[Any](a.numElements())
@@ -199,10 +199,7 @@ object EvaluatePython {
 
     case (c: Long, TimestampType) => c
 
-    case (c: String, StringType) => UTF8String.fromString(c)
-    case (c, StringType) =>
-      // If we get here, c is not a string. Call toString on it.
-      UTF8String.fromString(c.toString)
+    case (c, StringType) => UTF8String.fromString(c.toString)
 
     case (c: String, BinaryType) => c.getBytes("utf-8")
     case (c, BinaryType) if c.getClass.isArray && c.getClass.getComponentType.getName == "byte" => c
@@ -263,11 +260,11 @@ object EvaluatePython {
   }
 
   /**
-   * Pickler for InternalRow
+   * Pickler for external row.
    */
   private class RowPickler extends IObjectPickler {
 
-    private val cls = classOf[GenericInternalRowWithSchema]
+    private val cls = classOf[GenericRowWithSchema]
 
     // register this to Pickler and Unpickler
     def register(): Unit = {
@@ -282,7 +279,7 @@ object EvaluatePython {
       } else {
         // it will be memorized by Pickler to save some bytes
         pickler.save(this)
-        val row = obj.asInstanceOf[GenericInternalRowWithSchema]
+        val row = obj.asInstanceOf[GenericRowWithSchema]
         // schema should always be same object for memoization
         pickler.save(row.schema)
         out.write(Opcodes.TUPLE1)