aboutsummaryrefslogtreecommitdiff
path: root/core
diff options
context:
space:
mode:
authorReynold Xin <rxin@apache.org>2014-08-12 22:50:29 -0700
committerReynold Xin <rxin@apache.org>2014-08-12 22:50:29 -0700
commit676f98289dad61c091bb45bd35a2b9613b22d64a (patch)
tree56195950714160e2f9d52b6557f1560068a89ea4 /core
parentc235b83e2782cce0626ecc403c0a67e442be52c1 (diff)
downloadspark-676f98289dad61c091bb45bd35a2b9613b22d64a.tar.gz
spark-676f98289dad61c091bb45bd35a2b9613b22d64a.tar.bz2
spark-676f98289dad61c091bb45bd35a2b9613b22d64a.zip
[SPARK-2953] Allow using short names for io compression codecs
Instead of requiring "org.apache.spark.io.LZ4CompressionCodec", it is easier for users if Spark just accepts "lz4", "lzf", "snappy". Author: Reynold Xin <rxin@apache.org> Closes #1873 from rxin/compressionCodecShortForm and squashes the following commits: 9f50962 [Reynold Xin] Specify short-form compression codec names first. 63f78ee [Reynold Xin] Updated configuration documentation. 47b3848 [Reynold Xin] [SPARK-2953] Allow using short names for io compression codecs
Diffstat (limited to 'core')
-rw-r--r--core/src/main/scala/org/apache/spark/io/CompressionCodec.scala11
-rw-r--r--core/src/test/scala/org/apache/spark/io/CompressionCodecSuite.scala18
2 files changed, 27 insertions, 2 deletions
diff --git a/core/src/main/scala/org/apache/spark/io/CompressionCodec.scala b/core/src/main/scala/org/apache/spark/io/CompressionCodec.scala
index 1b66218d86..ef9c43ecf1 100644
--- a/core/src/main/scala/org/apache/spark/io/CompressionCodec.scala
+++ b/core/src/main/scala/org/apache/spark/io/CompressionCodec.scala
@@ -46,17 +46,24 @@ trait CompressionCodec {
private[spark] object CompressionCodec {
+
+ private val shortCompressionCodecNames = Map(
+ "lz4" -> classOf[LZ4CompressionCodec].getName,
+ "lzf" -> classOf[LZFCompressionCodec].getName,
+ "snappy" -> classOf[SnappyCompressionCodec].getName)
+
def createCodec(conf: SparkConf): CompressionCodec = {
createCodec(conf, conf.get("spark.io.compression.codec", DEFAULT_COMPRESSION_CODEC))
}
def createCodec(conf: SparkConf, codecName: String): CompressionCodec = {
- val ctor = Class.forName(codecName, true, Utils.getContextOrSparkClassLoader)
+ val codecClass = shortCompressionCodecNames.getOrElse(codecName.toLowerCase, codecName)
+ val ctor = Class.forName(codecClass, true, Utils.getContextOrSparkClassLoader)
.getConstructor(classOf[SparkConf])
ctor.newInstance(conf).asInstanceOf[CompressionCodec]
}
- val DEFAULT_COMPRESSION_CODEC = classOf[SnappyCompressionCodec].getName
+ val DEFAULT_COMPRESSION_CODEC = "snappy"
}
diff --git a/core/src/test/scala/org/apache/spark/io/CompressionCodecSuite.scala b/core/src/test/scala/org/apache/spark/io/CompressionCodecSuite.scala
index 3f882a724b..25be7f25c2 100644
--- a/core/src/test/scala/org/apache/spark/io/CompressionCodecSuite.scala
+++ b/core/src/test/scala/org/apache/spark/io/CompressionCodecSuite.scala
@@ -56,15 +56,33 @@ class CompressionCodecSuite extends FunSuite {
testCodec(codec)
}
+ test("lz4 compression codec short form") {
+ val codec = CompressionCodec.createCodec(conf, "lz4")
+ assert(codec.getClass === classOf[LZ4CompressionCodec])
+ testCodec(codec)
+ }
+
test("lzf compression codec") {
val codec = CompressionCodec.createCodec(conf, classOf[LZFCompressionCodec].getName)
assert(codec.getClass === classOf[LZFCompressionCodec])
testCodec(codec)
}
+ test("lzf compression codec short form") {
+ val codec = CompressionCodec.createCodec(conf, "lzf")
+ assert(codec.getClass === classOf[LZFCompressionCodec])
+ testCodec(codec)
+ }
+
test("snappy compression codec") {
val codec = CompressionCodec.createCodec(conf, classOf[SnappyCompressionCodec].getName)
assert(codec.getClass === classOf[SnappyCompressionCodec])
testCodec(codec)
}
+
+ test("snappy compression codec short form") {
+ val codec = CompressionCodec.createCodec(conf, "snappy")
+ assert(codec.getClass === classOf[SnappyCompressionCodec])
+ testCodec(codec)
+ }
}