aboutsummaryrefslogtreecommitdiff
path: root/sql
diff options
context:
space:
mode:
author Reynold Xin <rxin@databricks.com> 2015-11-24 14:51:01 -0800
committer Reynold Xin <rxin@databricks.com> 2015-11-24 14:51:01 -0800
commit 34ca392da7097a1fbe48cd6c3ebff51453ca26ca (patch)
tree 43deb0b0078def296013c648d402aa089a7d55a2 /sql
parent 58d9b260556a89a3d0832d583acafba1df7c6751 (diff)
download spark-34ca392da7097a1fbe48cd6c3ebff51453ca26ca.tar.gz
spark-34ca392da7097a1fbe48cd6c3ebff51453ca26ca.tar.bz2
spark-34ca392da7097a1fbe48cd6c3ebff51453ca26ca.zip
Added a line of comment to explain why the extra sort exists in pivot.
Diffstat (limited to 'sql')
-rw-r--r-- sql/core/src/main/scala/org/apache/spark/sql/GroupedData.scala 2
1 files changed, 1 insertions, 1 deletions
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/GroupedData.scala b/sql/core/src/main/scala/org/apache/spark/sql/GroupedData.scala
index ee7150cbbf..abd531c4ba 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/GroupedData.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/GroupedData.scala
@@ -304,7 +304,7 @@ class GroupedData protected[sql](
// Get the distinct values of the column and sort them so its consistent
val values = df.select(pivotColumn)
.distinct()
- .sort(pivotColumn)
+ .sort(pivotColumn) // ensure that the output columns are in a consistent logical order
.map(_.get(0))
.take(maxValues + 1)
.toSeq