aboutsummaryrefslogtreecommitdiff
path: root/mllib/src
diff options
context:
space:
mode:
author Reynold Xin <rxin@databricks.com> 2016-01-02 22:31:39 -0800
committer Reynold Xin <rxin@databricks.com> 2016-01-02 22:31:39 -0800
commit 513e3b092c4f3d58058ff64c861ea35cfec04205 (patch)
tree 9261547956aaf05953296302da9e4fc561a7dc05 /mllib/src
parent 15bd73627e04591fd13667b4838c9098342db965 (diff)
download spark-513e3b092c4f3d58058ff64c861ea35cfec04205.tar.gz
spark-513e3b092c4f3d58058ff64c861ea35cfec04205.tar.bz2
spark-513e3b092c4f3d58058ff64c861ea35cfec04205.zip
[SPARK-12599][MLLIB][SQL] Remove the use of callUDF in MLlib
callUDF has been deprecated. However, we do not have an alternative for users to specify the output data type without type tags. This pull request introduces a new API for that purpose and replaces the invocations of the deprecated callUDF with it.

Author: Reynold Xin <rxin@databricks.com>

Closes #10547 from rxin/SPARK-12599.
Diffstat (limited to 'mllib/src')
-rw-r--r-- mllib/src/main/scala/org/apache/spark/ml/Transformer.scala 4
1 file changed, 2 insertions, 2 deletions
diff --git a/mllib/src/main/scala/org/apache/spark/ml/Transformer.scala b/mllib/src/main/scala/org/apache/spark/ml/Transformer.scala
index 3c7bcf7590..1f3325ad09 100644
--- a/mllib/src/main/scala/org/apache/spark/ml/Transformer.scala
+++ b/mllib/src/main/scala/org/apache/spark/ml/Transformer.scala
@@ -115,8 +115,8 @@ abstract class UnaryTransformer[IN, OUT, T <: UnaryTransformer[IN, OUT, T]]
override def transform(dataset: DataFrame): DataFrame = {
transformSchema(dataset.schema, logging = true)
- dataset.withColumn($(outputCol),
- callUDF(this.createTransformFunc, outputDataType, dataset($(inputCol))))
+ val transformUDF = udf(this.createTransformFunc, outputDataType)
+ dataset.withColumn($(outputCol), transformUDF(dataset($(inputCol))))
}
override def copy(extra: ParamMap): T = defaultCopy(extra)