diff options
author | Patrick Wendell <pwendell@gmail.com> | 2014-01-14 11:57:53 -0800 |
---|---|---|
committer | Patrick Wendell <pwendell@gmail.com> | 2014-01-14 11:57:53 -0800 |
commit | 6f965a46a9ecef9b8297200ab679fdfea1ec599e (patch) | |
tree | ee8292434b725b4681f0ed265952025393f7f305 | |
parent | b07bc02a00881822d2cb350f20dca31ddbeed54b (diff) | |
download | spark-6f965a46a9ecef9b8297200ab679fdfea1ec599e.tar.gz spark-6f965a46a9ecef9b8297200ab679fdfea1ec599e.tar.bz2 spark-6f965a46a9ecef9b8297200ab679fdfea1ec599e.zip |
Don't clone records for text files
-rw-r--r-- | core/src/main/scala/org/apache/spark/SparkContext.scala | 4 |
1 files changed, 2 insertions, 2 deletions
```diff
diff --git a/core/src/main/scala/org/apache/spark/SparkContext.scala b/core/src/main/scala/org/apache/spark/SparkContext.scala
index 55ac76bf63..492238905f 100644
--- a/core/src/main/scala/org/apache/spark/SparkContext.scala
+++ b/core/src/main/scala/org/apache/spark/SparkContext.scala
@@ -340,8 +340,8 @@ class SparkContext(
    * Hadoop-supported file system URI, and return it as an RDD of Strings.
    */
   def textFile(path: String, minSplits: Int = defaultMinSplits): RDD[String] = {
-    hadoopFile(path, classOf[TextInputFormat], classOf[LongWritable], classOf[Text], minSplits)
-      .map(pair => pair._2.toString)
+    hadoopFile(path, classOf[TextInputFormat], classOf[LongWritable], classOf[Text],
+      minSplits, false).map(pair => pair._2.toString)
   }
 
   /**
```