summaryrefslogtreecommitdiff
path: root/site/releases/spark-release-1-0-1.html
diff options
context:
space:
mode:
authorPatrick Wendell <pwendell@apache.org>2014-07-12 00:45:34 +0000
committerPatrick Wendell <pwendell@apache.org>2014-07-12 00:45:34 +0000
commit7062d6dcaa2666c0370d79290e508d1b450ebb75 (patch)
tree5f08b52380a68ddaad64a07d0db6d19d035bda63 /site/releases/spark-release-1-0-1.html
parent22d1043d6976a4b431c30c261310f4ba1cb3650e (diff)
downloadspark-website-7062d6dcaa2666c0370d79290e508d1b450ebb75.tar.gz
spark-website-7062d6dcaa2666c0370d79290e508d1b450ebb75.tar.bz2
spark-website-7062d6dcaa2666c0370d79290e508d1b450ebb75.zip
New files for Spark 1.0.1 release.
Diffstat (limited to 'site/releases/spark-release-1-0-1.html')
-rw-r--r--site/releases/spark-release-1-0-1.html319
1 files changed, 319 insertions, 0 deletions
diff --git a/site/releases/spark-release-1-0-1.html b/site/releases/spark-release-1-0-1.html
new file mode 100644
index 000000000..077499e6f
--- /dev/null
+++ b/site/releases/spark-release-1-0-1.html
@@ -0,0 +1,319 @@
+<!DOCTYPE html>
+<html lang="en">
+<head>
+ <meta charset="utf-8">
+ <meta http-equiv="X-UA-Compatible" content="IE=edge">
+ <meta name="viewport" content="width=device-width, initial-scale=1.0">
+
+ <title>
+ Spark Release 1.0.1 | Apache Spark
+
+ </title>
+
+
+
+ <!-- Bootstrap core CSS -->
+ <link href="/css/cerulean.min.css" rel="stylesheet">
+ <link href="/css/custom.css" rel="stylesheet">
+
+ <script type="text/javascript">
+ <!-- Google Analytics initialization -->
+ var _gaq = _gaq || [];
+ _gaq.push(['_setAccount', 'UA-32518208-2']);
+ _gaq.push(['_trackPageview']);
+ (function() {
+ var ga = document.createElement('script'); ga.type = 'text/javascript'; ga.async = true;
+ ga.src = ('https:' == document.location.protocol ? 'https://ssl' : 'http://www') + '.google-analytics.com/ga.js';
+ var s = document.getElementsByTagName('script')[0]; s.parentNode.insertBefore(ga, s);
+ })();
+
+ <!-- Adds slight delay to links to allow async reporting -->
+ function trackOutboundLink(link, category, action) { // Records a GA event for a clicked link, then navigates to link.href.
+ try {
+ _gaq.push(['_trackEvent', category , action]); // queue the event (category, action) on the _gaq command array
+ } catch(err){} // any error from the push is swallowed, so the navigation below still runs
+
+ setTimeout(function() { // the download links on this page call this from onclick and then "return false", so navigation happens here
+ document.location.href = link.href;
+ }, 100); // 100 ms delay before navigating, to allow the async report to be sent
+ }
+ </script>
+
+ <!-- HTML5 shim and Respond.js IE8 support of HTML5 elements and media queries -->
+ <!--[if lt IE 9]>
+ <script src="https://oss.maxcdn.com/libs/html5shiv/3.7.0/html5shiv.js"></script>
+ <script src="https://oss.maxcdn.com/libs/respond.js/1.3.0/respond.min.js"></script>
+ <![endif]-->
+</head>
+
+<body>
+
+<div class="container" style="max-width: 1200px;">
+
+<div class="masthead">
+
+ <p class="lead">
+ <a href="/">
+ <img src="/images/spark-logo.png"
+ style="height:100px; width:auto; vertical-align: bottom; margin-top: 20px;"></a><span class="tagline">
+ Lightning-fast cluster computing
+ </span>
+ </p>
+
+</div>
+
+<nav class="navbar navbar-default" role="navigation">
+ <!-- Brand and toggle get grouped for better mobile display -->
+ <div class="navbar-header">
+ <button type="button" class="navbar-toggle" data-toggle="collapse"
+ data-target="#navbar-collapse-1">
+ <span class="sr-only">Toggle navigation</span>
+ <span class="icon-bar"></span>
+ <span class="icon-bar"></span>
+ <span class="icon-bar"></span>
+ </button>
+ </div>
+
+ <!-- Collect the nav links, forms, and other content for toggling -->
+ <div class="collapse navbar-collapse" id="navbar-collapse-1">
+ <ul class="nav navbar-nav">
+ <li><a href="/downloads.html">Download</a></li>
+ <li class="dropdown">
+ <a href="#" class="dropdown-toggle" data-toggle="dropdown">
+ Related Projects <b class="caret"></b>
+ </a>
+ <ul class="dropdown-menu">
+
+ <li><a href="/sql/">Spark SQL</a></li>
+ <li><a href="/streaming/">Spark Streaming</a></li>
+ <li><a href="/mllib/">MLlib (machine learning)</a></li>
+ <li><a href="/graphx/">GraphX (graph)</a></li>
+ </ul>
+ </li>
+ <li class="dropdown">
+ <a href="#" class="dropdown-toggle" data-toggle="dropdown">
+ Documentation <b class="caret"></b>
+ </a>
+ <ul class="dropdown-menu">
+ <li><a href="/documentation.html">Overview</a></li>
+ <li><a href="/docs/latest/">Latest Release (Spark 1.0.1)</a></li>
+ <li><a href="/examples.html">Examples</a></li>
+ </ul>
+ </li>
+ <li class="dropdown">
+ <a href="#" class="dropdown-toggle" data-toggle="dropdown">
+ Community <b class="caret"></b>
+ </a>
+ <ul class="dropdown-menu">
+ <li><a href="/community.html">Mailing Lists</a></li>
+ <li><a href="/community.html#events">Events and Meetups</a></li>
+ <li><a href="/community.html#history">Project History</a></li>
+ <li><a href="https://cwiki.apache.org/confluence/display/SPARK/Powered+By+Spark">Powered By</a></li>
+ </ul>
+ </li>
+ <li><a href="/faq.html">FAQ</a></li>
+ </ul>
+ </div>
+ <!-- /.navbar-collapse -->
+</nav>
+
+
+<div class="row">
+ <div class="col-md-3 col-md-push-9">
+ <div class="news" style="margin-bottom: 20px;">
+ <h5>Latest News</h5>
+ <ul class="list-unstyled">
+
+ <li><a href="/news/spark-1-0-1-released.html">Spark 1.0.1 released</a>
+ <span class="small">(Jul 11, 2014)</span></li>
+
+ <li><a href="/news/two-weeks-to-spark-summit-2014.html">Two weeks to Spark Summit 2014</a>
+ <span class="small">(Jun 16, 2014)</span></li>
+
+ <li><a href="/news/spark-1-0-0-released.html">Spark 1.0.0 released</a>
+ <span class="small">(May 30, 2014)</span></li>
+
+ <li><a href="/news/spark-summit-agenda-posted.html">Spark Summit agenda posted</a>
+ <span class="small">(May 11, 2014)</span></li>
+
+ </ul>
+ <p class="small" style="text-align: right;"><a href="/news/index.html">Archive</a></p>
+ </div>
+ <div class="hidden-xs hidden-sm">
+ <a href="/downloads.html" class="btn btn-success btn-lg btn-block" style="margin-bottom: 30px;">
+ Download Spark
+ </a>
+ <p style="font-size: 16px; font-weight: 500; color: #555;">
+ Related Projects:
+ </p>
+ <ul class="list-narrow">
+
+ <li><a href="/sql/">Spark SQL</a></li>
+ <li><a href="/streaming/">Spark Streaming</a></li>
+ <li><a href="/mllib/">MLlib (machine learning)</a></li>
+ <li><a href="/graphx/">GraphX (graph)</a></li>
+ </ul>
+ </div>
+ </div>
+
+ <div class="col-md-9 col-md-pull-3">
+ <h2>Spark Release 1.0.1</h2>
+
+
+<p>Spark 1.0.1 is a maintenance release with several stability fixes and a few new features in Spark’s SQL (alpha) library. This release is based on the <a href="https://github.com/apache/spark/tree/branch-1.0">branch-1.0</a> maintenance branch of Spark. We recommend users follow the head of this branch to get the most recent stable version of Spark.</p>
+
+<p>You can download Spark 1.0.1 as either a
+<a href="http://d3kbcqa49mib13.cloudfront.net/spark-1.0.1.tgz" onclick="trackOutboundLink(this, 'Release Download Links', 'cloudfront_spark-1.0.1.tgz'); return false;">source package</a>
+(5 MB tgz) or a prebuilt package for
+<a href="http://d3kbcqa49mib13.cloudfront.net/spark-1.0.1-bin-hadoop1.tgz" onclick="trackOutboundLink(this, 'Release Download Links', 'cloudfront_spark-1.0.1-bin-hadoop1.tgz'); return false;">Hadoop 1 / CDH3</a>,
+<a href="http://d3kbcqa49mib13.cloudfront.net/spark-1.0.1-bin-cdh4.tgz" onclick="trackOutboundLink(this, 'Release Download Links', 'cloudfront_spark-1.0.1-bin-cdh4.tgz'); return false;">CDH4</a>, or
+<a href="http://d3kbcqa49mib13.cloudfront.net/spark-1.0.1-bin-hadoop2.tgz" onclick="trackOutboundLink(this, 'Release Download Links', 'cloudfront_spark-1.0.1-bin-hadoop2.tgz'); return false;">Hadoop 2 / CDH5 / HDP2</a>
+(160 MB tgz). Release signatures and checksums are available at the official <a href="http://www.apache.org/dist/spark/spark-1.0.1/">Apache download site</a>.</p>
+
+<h3 id="fixes">Fixes</h3>
+<p>Spark 1.0.1 contains stability fixes in several components. Some of the more important fixes are highlighted below. You can visit the <a href="http://s.apache.org/5zh">Spark issue tracker</a> for an exhaustive list of fixes.</p>
+
+<h4 id="spark-core">Spark Core</h4>
+<ul>
+ <li>Issue with missing keys during external aggregations (<a href="https://issues.apache.org/jira/browse/SPARK-2043">SPARK-2043</a>)</li>
+ <li>Issue during job failures in Mesos mode (<a href="https://issues.apache.org/jira/browse/SPARK-1749">SPARK-1749</a>)</li>
+ <li>Error when defining case classes in Scala shell (<a href="https://issues.apache.org/jira/browse/SPARK-1199">SPARK-1199</a>)</li>
+ <li>Proper support for r3.xlarge instances on AWS (<a href="https://issues.apache.org/jira/browse/SPARK-1790">SPARK-1790</a>)</li>
+</ul>
+
+<h4 id="pyspark">PySpark</h4>
+<ul>
+ <li>Issue causing crashes when large numbers of tasks finish quickly (<a href="https://issues.apache.org/jira/browse/SPARK-2282">SPARK-2282</a>)</li>
+ <li>Issue importing MLlib in YARN-client mode (<a href="https://issues.apache.org/jira/browse/SPARK-2172">SPARK-2172</a>)</li>
+ <li>Incorrect behavior when hashing None (<a href="https://issues.apache.org/jira/browse/SPARK-1468">SPARK-1468</a>)</li>
+</ul>
+
+<h4 id="mllib">MLlib</h4>
+<ul>
+ <li>Added compatibility for numpy 1.4 (<a href="https://issues.apache.org/jira/browse/SPARK-2091">SPARK-2091</a>)</li>
+ <li>Concurrency issue in random sampler (<a href="https://issues.apache.org/jira/browse/SPARK-2251">SPARK-2251</a>)</li>
+ <li>NotSerializable exception in ALS (<a href="https://issues.apache.org/jira/browse/SPARK-1977">SPARK-1977</a>)</li>
+</ul>
+
+<h4 id="streaming">Streaming</h4>
+<ul>
+ <li>Key not found when slow receiver starts (<a href="https://issues.apache.org/jira/browse/SPARK-2009">SPARK-2009</a>)</li>
+ <li>Resource clean-up with KafkaInputDStream (<a href="https://issues.apache.org/jira/browse/SPARK-2034">SPARK-2034</a>)</li>
+ <li>Issue with Flume events larger than 1020 bytes (<a href="https://issues.apache.org/jira/browse/SPARK-1916">SPARK-1916</a>)</li>
+</ul>
+
+<h3 id="sparksql-features">SparkSQL Features</h3>
+<ul>
+ <li>Support for querying JSON datasets (<a href="https://issues.apache.org/jira/browse/SPARK-2060">SPARK-2060</a>).</li>
+ <li>Improved reading and writing Parquet data, including support for nested records and arrays (<a href="https://issues.apache.org/jira/browse/SPARK-1293">SPARK-1293</a>, <a href="https://issues.apache.org/jira/browse/SPARK-2195">SPARK-2195</a>, <a href="https://issues.apache.org/jira/browse/SPARK-1913">SPARK-1913</a>, and <a href="https://issues.apache.org/jira/browse/SPARK-1487">SPARK-1487</a>).</li>
+ <li>Improved support for SQL commands (<code>CACHE TABLE</code>, <code>DESCRIBE</code>, <code>SHOW TABLES</code>) (<a href="https://issues.apache.org/jira/browse/SPARK-1968">SPARK-1968</a>, <a href="https://issues.apache.org/jira/browse/SPARK-2128">SPARK-2128</a>, and <a href="https://issues.apache.org/jira/browse/SPARK-1704">SPARK-1704</a>).</li>
+ <li>Support for SQL specific configuration (initially used for setting number of partitions) (<a href="https://issues.apache.org/jira/browse/SPARK-1508">SPARK-1508</a>).</li>
+ <li>Idempotence for DDL operations (<a href="https://issues.apache.org/jira/browse/SPARK-2191">SPARK-2191</a>).</li>
+</ul>
+
+<h3 id="known-issues">Known Issues</h3>
+<p>This release contains one known issue: multi-statement lines in the REPL with internal references (<code>&gt; val x = 10; val y = x + 10</code>) produce exceptions (<a href="https://issues.apache.org/jira/browse/SPARK-2452">SPARK-2452</a>). This will be fixed shortly on the 1.0 branch; the fix will be included in the 1.0.2 release.</p>
+
+<h3 id="contributors">Contributors</h3>
+<p>The following developers contributed to this release:</p>
+
+<ul>
+ <li>Aaron Davidson &#8211; bug fixes in PySpark and Spark core</li>
+ <li>Ali Ghodsi &#8211; documentation update</li>
+ <li>Anant &#8211; compatibility fix for spark-ec2 script</li>
+ <li>Anatoli Fomenko &#8211; MLlib doc fix</li>
+ <li>Andre Schumacher &#8211; nested Parquet data</li>
+ <li>Andrew Ash &#8211; documentation</li>
+ <li>Andrew Or &#8211; bug fixes and documentation</li>
+ <li>Ankur Dave &#8211; bug fixes</li>
+ <li>Arkadiusz Komarzewski &#8211; doc fix</li>
+ <li>Baishuo &#8211; SQL fix</li>
+ <li>Chen Chao &#8211; comment fix and bug fix</li>
+ <li>Cheng Hao &#8211; SQL features</li>
+ <li>Cheng Lian &#8211; SQL features</li>
+ <li>Christian Tzolov &#8211; build improvement</li>
+ <li>Clément MATHIEU &#8211; doc updates </li>
+ <li>CodingCat &#8211; doc updates and bug fix </li>
+ <li>Colin McCabe &#8211; bug fix</li>
+ <li>Daoyuan &#8211; SQL joins</li>
+ <li>David Lemieux &#8211; bug fix</li>
+ <li>Derek Ma &#8211; bug fix</li>
+ <li>Doris Xin &#8211; bug fix</li>
+ <li>Erik Selin &#8211; PySpark fix</li>
+ <li>Gang Bai &#8211; bug fix</li>
+ <li>Guoqiang Li &#8211; bug fixes</li>
+ <li>Henry Saputra &#8211; documentation</li>
+ <li>Jiang &#8211; doc fix</li>
+ <li>Joy Yoj &#8211; bug fix</li>
+ <li>Jyotiska NK &#8211; test improvement</li>
+ <li>Kan Zhang &#8211; PySpark SQL features</li>
+ <li>Kay Ousterhout &#8211; documentation fix</li>
+ <li>LY Lai &#8211; bug fix</li>
+ <li>Lars Albertsson &#8211; bug fix </li>
+ <li>Lei Zhang &#8211; SQL fix and feature</li>
+ <li>Mark Hamstra &#8211; bug fix</li>
+ <li>Matei Zaharia &#8211; doc updates and bug fix</li>
+ <li>Matthew Farrellee &#8211; bug fixes</li>
+ <li>Michael Armbrust &#8211; SQL features and fixes</li>
+ <li>Neville Li &#8211; bug fix</li>
+ <li>Nick Chammas &#8211; doc fix</li>
+ <li>Ori Kremer &#8211; bug fix</li>
+ <li>Patrick Wendell &#8211; documentation and release manager</li>
+ <li>Prashant Sharma &#8211; bug and doc fixes</li>
+ <li>Qiuzhuang.Lian &#8211; bug fix</li>
+ <li>Raymond Liu &#8211; bug fix</li>
+ <li>Ravikanth Nawada &#8211; bug fixes</li>
+ <li>Reynold Xin &#8211; bug and doc fixes</li>
+ <li>Sameer Agarwal &#8211; optimization</li>
+ <li>Sandy Ryza &#8211; doc fix</li>
+ <li>Sean Owen &#8211; bug fix</li>
+ <li>Sebastien Rainville &#8211; bug fix</li>
+ <li>Shixiong Zhu &#8211; code clean-up</li>
+ <li>Szul, Piotr &#8211; bug fix</li>
+ <li>Takuya UESHIN &#8211; bug fixes and SQL features</li>
+ <li>Thomas Graves &#8211; bug fix </li>
+ <li>Uri Laserson &#8211; bug fix</li>
+ <li>Vadim Chekan &#8211; bug fix</li>
+ <li>Varakhedi Sujeet &#8211; ec2 r3 support</li>
+ <li>Vlad &#8211; doc fix</li>
+ <li>Wang Lianhui &#8211; bug fix</li>
+ <li>Wenchen Fan &#8211; optimization</li>
+ <li>William Benton &#8211; SQL feature</li>
+ <li>Xi Liu &#8211; SQL feature</li>
+ <li>Xiangrui Meng &#8211; bug fix</li>
+ <li>Ximo Guanter Gonzalbez &#8211; SQL feature</li>
+ <li>Yadid Ayzenberg &#8211; doc fix</li>
+ <li>Yijie Shen &#8211; bug fix</li>
+ <li>Yin Huai &#8211; JSON support and bug fixes</li>
+ <li>Zhen Peng &#8211; bug fix</li>
+ <li>Zichuan Ye &#8211; ec2 fixes</li>
+ <li>Zongheng Yang &#8211; SQL fixes</li>
+</ul>
+
+<p><em>Thanks to everyone who contributed!</em></p>
+
+
+<p>
+<br/>
+<a href="/news/">Spark News Archive</a>
+</p>
+
+ </div>
+</div>
+
+
+
+<footer class="small">
+ <hr>
+ Apache Spark, Spark, Apache, and the Spark logo are trademarks of
+ <a href="http://www.apache.org">The Apache Software Foundation</a>.
+</footer>
+
+</div>
+
+<script src="https://code.jquery.com/jquery.js"></script>
+<script src="//netdna.bootstrapcdn.com/bootstrap/3.0.3/js/bootstrap.min.js"></script>
+<script src="/js/lang-tabs.js"></script>
+
+</body>
+</html>