aboutsummaryrefslogtreecommitdiff
diff options
context:
space:
mode:
author Harvey <h.feng@berkeley.edu> 2012-08-03 12:22:07 -0700
committer Harvey <h.feng@berkeley.edu> 2012-08-03 12:22:07 -0700
commit 5ec13327d4041df59c3c9d842658cbecbdbf2567 (patch)
tree b8208bfff03bb4743e05fe0ef6ed657420e6762c
parent 4a9c58913d0a9bd51811dedca934a2a0adbe8d37 (diff)
download spark-5ec13327d4041df59c3c9d842658cbecbdbf2567.tar.gz
spark-5ec13327d4041df59c3c9d842658cbecbdbf2567.tar.bz2
spark-5ec13327d4041df59c3c9d842658cbecbdbf2567.zip
Fix for partitioning when sorting in descending order
-rw-r--r-- core/src/main/scala/spark/Partitioner.scala 3
1 file changed, 1 insertion, 2 deletions
diff --git a/core/src/main/scala/spark/Partitioner.scala b/core/src/main/scala/spark/Partitioner.scala
index 2235a0ec3d..4ef871bbf9 100644
--- a/core/src/main/scala/spark/Partitioner.scala
+++ b/core/src/main/scala/spark/Partitioner.scala
@@ -39,8 +39,7 @@ class RangePartitioner[K <% Ordered[K]: ClassManifest, V](
val rddSize = rdd.count()
val maxSampleSize = partitions * 10.0
val frac = math.min(maxSampleSize / math.max(rddSize, 1), 1.0)
- val rddSample = rdd.sample(true, frac, 1).map(_._1).collect()
- .sortWith((x, y) => if (ascending) x < y else x > y)
+ val rddSample = rdd.sample(true, frac, 1).map(_._1).collect().sortWith(_ < _)
if (rddSample.length == 0) {
Array()
} else {