about | summary | refs | log | tree | commit | diff
path: root/core/src/main/scala/spark/RDD.scala
diff options
context:
space:
mode:
Diffstat (limited to 'core/src/main/scala/spark/RDD.scala')
-rw-r--r-- core/src/main/scala/spark/RDD.scala | 4
1 files changed, 3 insertions, 1 deletions
diff --git a/core/src/main/scala/spark/RDD.scala b/core/src/main/scala/spark/RDD.scala
index 2c3acc1b69..59e50a0b6b 100644
--- a/core/src/main/scala/spark/RDD.scala
+++ b/core/src/main/scala/spark/RDD.scala
@@ -205,9 +205,11 @@ abstract class RDD[T: ClassManifest](
/**
* Return a new RDD containing the distinct elements in this RDD.
*/
- def distinct(numSplits: Int = splits.size): RDD[T] =
+ def distinct(numSplits: Int): RDD[T] =
map(x => (x, null)).reduceByKey((x, y) => x, numSplits).map(_._1)
+ def distinct(): RDD[T] = distinct(splits.size)
+
/**
* Return a sampled subset of this RDD.
*/