summaryrefslogtreecommitdiff
path: root/site/third-party-projects.html
diff options
context:
space:
mode:
Diffstat (limited to 'site/third-party-projects.html')
-rw-r--r--site/third-party-projects.html287
1 files changed, 287 insertions, 0 deletions
diff --git a/site/third-party-projects.html b/site/third-party-projects.html
new file mode 100644
index 000000000..58d48936d
--- /dev/null
+++ b/site/third-party-projects.html
@@ -0,0 +1,287 @@
+<!DOCTYPE html>
+<html lang="en">
+<head>
+ <meta charset="utf-8">
+ <meta http-equiv="X-UA-Compatible" content="IE=edge">
+ <meta name="viewport" content="width=device-width, initial-scale=1.0">
+
+ <title>
+ Third-Party Projects | Apache Spark
+
+ </title>
+
+
+
+
+
+ <!-- Bootstrap core CSS -->
+ <link href="/css/cerulean.min.css" rel="stylesheet">
+ <link href="/css/custom.css" rel="stylesheet">
+
+ <!-- Code highlighter CSS -->
+ <link href="/css/pygments-default.css" rel="stylesheet">
+
+ <script type="text/javascript">
+   // Google Analytics initialization: queue the account id and a page view, then load ga.js asynchronously.
+   var _gaq = _gaq || [];
+   _gaq.push(['_setAccount', 'UA-32518208-2']);
+   _gaq.push(['_trackPageview']);
+   (function() {
+     var ga = document.createElement('script'); ga.type = 'text/javascript'; ga.async = true;
+     ga.src = ('https:' == document.location.protocol ? 'https://ssl' : 'http://www') + '.google-analytics.com/ga.js';
+     var s = document.getElementsByTagName('script')[0]; s.parentNode.insertBefore(ga, s);
+   })();
+
+   // Queues a _trackEvent for (category, action), then navigates to link.href after a slight delay to allow async reporting.
+   function trackOutboundLink(link, category, action) {
+     try {
+       _gaq.push(['_trackEvent', category , action]);
+     } catch(err){} // best effort: a failed tracking call must not prevent the navigation below
+
+     setTimeout(function() {
+       document.location.href = link.href;
+     }, 100);
+   }
+ </script>
+
+ <!-- HTML5 shim and Respond.js IE8 support of HTML5 elements and media queries -->
+ <!--[if lt IE 9]>
+ <script src="https://oss.maxcdn.com/libs/html5shiv/3.7.0/html5shiv.js"></script>
+ <script src="https://oss.maxcdn.com/libs/respond.js/1.3.0/respond.min.js"></script>
+ <![endif]-->
+</head>
+
+<body>
+
+<script src="https://code.jquery.com/jquery.js"></script>
+<script src="https://netdna.bootstrapcdn.com/bootstrap/3.0.3/js/bootstrap.min.js"></script>
+<script src="/js/lang-tabs.js"></script>
+<script src="/js/downloads.js"></script>
+
+<div class="container" style="max-width: 1200px;">
+
+<div class="masthead">
+
+ <p class="lead">
+ <a href="/">
+ <img src="/images/spark-logo-trademark.png" alt="Apache Spark"
+ style="height:100px; width:auto; vertical-align: bottom; margin-top: 20px;"></a><span class="tagline">
+ Lightning-fast cluster computing
+ </span>
+ </p>
+
+</div>
+
+<nav class="navbar navbar-default" role="navigation">
+ <!-- Brand and toggle get grouped for better mobile display -->
+ <div class="navbar-header">
+ <button type="button" class="navbar-toggle" data-toggle="collapse"
+ data-target="#navbar-collapse-1">
+ <span class="sr-only">Toggle navigation</span>
+ <span class="icon-bar"></span>
+ <span class="icon-bar"></span>
+ <span class="icon-bar"></span>
+ </button>
+ </div>
+
+ <!-- Collect the nav links, forms, and other content for toggling -->
+ <div class="collapse navbar-collapse" id="navbar-collapse-1">
+ <ul class="nav navbar-nav">
+ <li><a href="/downloads.html">Download</a></li>
+ <li class="dropdown">
+ <a href="#" class="dropdown-toggle" data-toggle="dropdown">
+ Libraries <b class="caret"></b>
+ </a>
+ <ul class="dropdown-menu">
+ <li><a href="/sql/">SQL and DataFrames</a></li>
+ <li><a href="/streaming/">Spark Streaming</a></li>
+ <li><a href="/mllib/">MLlib (machine learning)</a></li>
+ <li><a href="/graphx/">GraphX (graph)</a></li>
+ <li class="divider"></li>
+ <li><a href="/third-party-projects.html">Third-Party Projects</a></li>
+ </ul>
+ </li>
+ <li class="dropdown">
+ <a href="#" class="dropdown-toggle" data-toggle="dropdown">
+ Documentation <b class="caret"></b>
+ </a>
+ <ul class="dropdown-menu">
+ <li><a href="/docs/latest/">Latest Release (Spark 2.0.2)</a></li>
+ <li><a href="/documentation.html">Older Versions and Other Resources</a></li>
+ </ul>
+ </li>
+ <li><a href="/examples.html">Examples</a></li>
+ <li class="dropdown">
+ <a href="/community.html" class="dropdown-toggle" data-toggle="dropdown">
+ Community <b class="caret"></b>
+ </a>
+ <ul class="dropdown-menu">
+ <li><a href="/community.html#mailing-lists">Mailing Lists</a></li>
+ <li><a href="/contributing.html">Contributing to Spark</a></li>
+ <li><a href="https://issues.apache.org/jira/browse/SPARK">Issue Tracker</a></li>
+ <li><a href="/community.html#events">Events and Meetups</a></li>
+ <li><a href="/community.html#history">Project History</a></li>
+ <li><a href="/powered-by.html">Powered By</a></li>
+ <li><a href="/committers.html">Project Committers</a></li>
+ </ul>
+ </li>
+ <li><a href="/faq.html">FAQ</a></li>
+ </ul>
+ <ul class="nav navbar-nav navbar-right">
+ <li class="dropdown">
+ <a href="http://www.apache.org/" class="dropdown-toggle" data-toggle="dropdown">
+ Apache Software Foundation <b class="caret"></b></a>
+ <ul class="dropdown-menu">
+ <li><a href="http://www.apache.org/">Apache Homepage</a></li>
+ <li><a href="http://www.apache.org/licenses/">License</a></li>
+ <li><a href="http://www.apache.org/foundation/sponsorship.html">Sponsorship</a></li>
+ <li><a href="http://www.apache.org/foundation/thanks.html">Thanks</a></li>
+ <li><a href="http://www.apache.org/security/">Security</a></li>
+ </ul>
+ </li>
+ </ul>
+ </div>
+ <!-- /.navbar-collapse -->
+</nav>
+
+
+<div class="row">
+ <div class="col-md-3 col-md-push-9">
+ <div class="news" style="margin-bottom: 20px;">
+ <h5>Latest News</h5>
+ <ul class="list-unstyled">
+
+ <li><a href="/news/spark-wins-cloudsort-100tb-benchmark.html">Spark wins CloudSort Benchmark as the most efficient engine</a>
+ <span class="small">(Nov 15, 2016)</span></li>
+
+ <li><a href="/news/spark-2-0-2-released.html">Spark 2.0.2 released</a>
+ <span class="small">(Nov 14, 2016)</span></li>
+
+ <li><a href="/news/spark-1-6-3-released.html">Spark 1.6.3 released</a>
+ <span class="small">(Nov 07, 2016)</span></li>
+
+ <li><a href="/news/spark-2-0-1-released.html">Spark 2.0.1 released</a>
+ <span class="small">(Oct 03, 2016)</span></li>
+
+ </ul>
+ <p class="small" style="text-align: right;"><a href="/news/index.html">Archive</a></p>
+ </div>
+ <div class="hidden-xs hidden-sm">
+ <a href="/downloads.html" class="btn btn-success btn-lg btn-block" style="margin-bottom: 30px;">
+ Download Spark
+ </a>
+ <p style="font-size: 16px; font-weight: 500; color: #555;">
+ Built-in Libraries:
+ </p>
+ <ul class="list-none">
+ <li><a href="/sql/">SQL and DataFrames</a></li>
+ <li><a href="/streaming/">Spark Streaming</a></li>
+ <li><a href="/mllib/">MLlib (machine learning)</a></li>
+ <li><a href="/graphx/">GraphX (graph)</a></li>
+ </ul>
+ <a href="/third-party-projects.html">Third-Party Projects</a>
+ </div>
+ </div>
+
+ <div class="col-md-9 col-md-pull-3">
+ <p>This page tracks external software projects that supplement Apache Spark and add to its ecosystem.</p>
+
+<h2>spark-packages.org</h2>
+
+<p><a href="https://spark-packages.org/">spark-packages.org</a> is an external,
+community-managed list of third-party libraries, add-ons, and applications that work with
+Apache Spark. You can add a package as long as you have a GitHub repository.</p>
+
+<h2>Infrastructure Projects</h2>
+
+<ul>
+ <li><a href="https://github.com/spark-jobserver/spark-jobserver">Spark Job Server</a> -
+REST interface for managing and submitting Spark jobs on the same cluster
+(see <a href="http://engineering.ooyala.com/blog/open-sourcing-our-spark-job-server">blog post</a>
+for details)</li>
+ <li><a href="https://github.com/amplab-extras/SparkR-pkg">SparkR</a> - R frontend for Spark</li>
+ <li><a href="http://mlbase.org/">MLbase</a> - Machine Learning research project on top of Spark</li>
+ <li><a href="http://mesos.apache.org/">Apache Mesos</a> - Cluster management system that supports
+running Spark</li>
+ <li><a href="http://alluxio.org/">Alluxio</a> (née Tachyon) - Memory speed virtual distributed
+storage system that supports running Spark</li>
+ <li><a href="https://github.com/datastax/spark-cassandra-connector">Spark Cassandra Connector</a> -
+Easily load your Cassandra data into Spark and Spark SQL; from Datastax</li>
+ <li><a href="https://github.com/tuplejump/FiloDB">FiloDB</a> - a Spark integrated analytical/columnar
+database, with in-memory option capable of sub-second concurrent queries</li>
+ <li><a href="http://www.elasticsearch.org/guide/en/elasticsearch/hadoop/master/spark.html#spark-sql">Elasticsearch -
+Spark SQL Integration</a></li>
+ <li><a href="https://github.com/tresata/spark-scalding">Spark-Scalding</a> - Easily transition
+Cascading/Scalding code to Spark</li>
+ <li><a href="http://zeppelin-project.org/">Zeppelin</a> - an IPython-like notebook for Spark. There
+is also <a href="https://github.com/tribbloid/ISpark">ISpark</a>, and the
+<a href="https://github.com/andypetrella/spark-notebook/">Spark Notebook</a>.</li>
+ <li><a href="http://www.ibm.com/developerworks/servicemanagement/tc/pcs/index.html">IBM Spectrum Conductor with Spark</a> -
+cluster management software that integrates with Spark</li>
+ <li><a href="https://github.com/EclairJS/eclairjs-node">EclairJS</a> - enables Node.js developers to code
+against Spark, and data scientists to use JavaScript in Jupyter notebooks.</li>
+ <li><a href="https://github.com/SnappyDataInc/snappydata">SnappyData</a> - an open source
+OLTP + OLAP database integrated with Spark on the same JVMs.</li>
+ <li><a href="https://github.com/DataSystemsLab/GeoSpark">GeoSpark</a> - Geospatial RDDs and joins</li>
+ <li><a href="https://github.com/ispras/spark-openstack">Spark Cluster Deploy Tools for OpenStack</a></li>
+</ul>
+
+<h2>Applications Using Spark</h2>
+
+<ul>
+ <li><a href="http://mahout.apache.org/">Apache Mahout</a> - Previously on Hadoop MapReduce,
+Mahout has switched to using Spark as the backend</li>
+ <li><a href="https://wiki.apache.org/mrql/">Apache MRQL</a> - A query processing and optimization
+system for large-scale, distributed data analysis, built on top of Apache Hadoop, Hama, and Spark</li>
+ <li><a href="http://blinkdb.org/">BlinkDB</a> - a massively parallel, approximate query engine built
+on top of Shark and Spark</li>
+ <li><a href="https://github.com/adobe-research/spindle">Spindle</a> - Spark/Parquet-based web
+analytics query engine</li>
+ <li><a href="http://simin.me/projects/spatialspark/">Spark Spatial</a> - Spatial joins and
+processing for Spark</li>
+ <li><a href="https://github.com/thunderain-project/thunderain">Thunderain</a> - a framework
+for combining stream processing with historical data, think Lambda architecture</li>
+ <li><a href="https://github.com/AyasdiOpenSource/df">DF</a> from Ayasdi - a Pandas-like data frame
+implementation for Spark</li>
+ <li><a href="https://github.com/OryxProject/oryx">Oryx</a> - Lambda architecture on Apache Spark,
+Apache Kafka for real-time large scale machine learning</li>
+ <li><a href="https://github.com/bigdatagenomics/adam">ADAM</a> - A framework and CLI for loading,
+transforming, and analyzing genomic data using Apache Spark</li>
+</ul>
+
+<h2>Additional Language Bindings</h2>
+
+<h3>C# / .NET</h3>
+
+<ul>
+ <li><a href="https://github.com/Microsoft/SparkCLR">CLR for Spark</a></li>
+</ul>
+
+<h3>Clojure</h3>
+
+<ul>
+ <li><a href="https://github.com/TheClimateCorporation/clj-spark">clj-spark</a></li>
+ <li><a href="https://spark-packages.org/package/21">Sparkling</a></li>
+</ul>
+
+<h3>Groovy</h3>
+
+<ul>
+ <li><a href="https://github.com/bunions1/groovy-spark-example">groovy-spark-example</a></li>
+</ul>
+
+ </div>
+</div>
+
+
+
+<footer class="small">
+ <hr>
+ Apache Spark, Spark, Apache, and the Spark logo are <a href="/trademarks.html">trademarks</a> of
+ <a href="http://www.apache.org">The Apache Software Foundation</a>.
+</footer>
+
+</div>
+
+</body>
+</html>