aboutsummaryrefslogtreecommitdiff
path: root/mllib/src/main/scala
diff options
context:
space:
mode:
author: Wenchen Fan <wenchen@databricks.com> 2016-05-18 18:06:38 -0700
committer: Yin Huai <yhuai@databricks.com> 2016-05-18 18:06:38 -0700
commit: ebfe3a1f2c77e6869c3c36ba67afb7fabe6a94f5 (patch)
tree: 9b415f466b981db6e208801df9898944ea28dca0 /mllib/src/main/scala
parent: 32be51fba45f5e07a2a3520293c12dc7765a364d (diff)
download: spark-ebfe3a1f2c77e6869c3c36ba67afb7fabe6a94f5.tar.gz
spark-ebfe3a1f2c77e6869c3c36ba67afb7fabe6a94f5.tar.bz2
spark-ebfe3a1f2c77e6869c3c36ba67afb7fabe6a94f5.zip
[SPARK-15192][SQL] null check for SparkSession.createDataFrame
## What changes were proposed in this pull request?

This PR adds a null check in `SparkSession.createDataFrame`, so that we can make sure the passed-in rows match the given schema.

## How was this patch tested?

New tests in `DatasetSuite`.

Author: Wenchen Fan <wenchen@databricks.com>

Closes #13008 from cloud-fan/row-encoder.
Diffstat (limited to 'mllib/src/main/scala')
-rw-r--r-- mllib/src/main/scala/org/apache/spark/mllib/fpm/FPGrowth.scala 2
1 files changed, 1 insertions, 1 deletions
diff --git a/mllib/src/main/scala/org/apache/spark/mllib/fpm/FPGrowth.scala b/mllib/src/main/scala/org/apache/spark/mllib/fpm/FPGrowth.scala
index 9166faa54d..28e4966f91 100644
--- a/mllib/src/main/scala/org/apache/spark/mllib/fpm/FPGrowth.scala
+++ b/mllib/src/main/scala/org/apache/spark/mllib/fpm/FPGrowth.scala
@@ -116,7 +116,7 @@ object FPGrowthModel extends Loader[FPGrowthModel[_]] {
StructField("freq", LongType))
val schema = StructType(fields)
val rowDataRDD = model.freqItemsets.map { x =>
- Row(x.items, x.freq)
+ Row(x.items.toSeq, x.freq)
}
sqlContext.createDataFrame(rowDataRDD, schema).write.parquet(Loader.dataPath(path))
}