summary | refs | log | tree | commit | diff
path: root/site/docs/0.6.1/api/core/spark/rdd/UnionRDD.html
diff options
context:
space:
mode:
Diffstat (limited to 'site/docs/0.6.1/api/core/spark/rdd/UnionRDD.html')
-rw-r--r-- site/docs/0.6.1/api/core/spark/rdd/UnionRDD.html 964
1 files changed, 964 insertions, 0 deletions
diff --git a/site/docs/0.6.1/api/core/spark/rdd/UnionRDD.html b/site/docs/0.6.1/api/core/spark/rdd/UnionRDD.html
new file mode 100644
index 000000000..0bb390183
--- /dev/null
+++ b/site/docs/0.6.1/api/core/spark/rdd/UnionRDD.html
@@ -0,0 +1,964 @@
+<?xml version='1.0' encoding='UTF-8'?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.1//EN" "http://www.w3.org/TR/xhtml11/DTD/xhtml11.dtd">
+<html>
+ <head>
+ <title>spark.rdd.UnionRDD</title>
+ <meta http-equiv="content-type" content="text/html; charset=UTF-8" />
+
+ <link type="text/css" media="screen" rel="stylesheet" href="../../lib/template.css" />
+ <script type="text/javascript" src="../../lib/jquery.js"></script>
+ <script type="text/javascript" src="../../lib/jquery-ui.js"></script>
+ <script type="text/javascript" src="../../lib/template.js"></script>
+ <script type="text/javascript" src="../../lib/tools.tooltip.js"></script>
+
+ </head>
+ <body onload="sh_highlightDocument('../lib/', '.min.js');" class="type">
+ <div id="definition">
+ <img src="../../lib/class_big.png" alt="" />
+ <p id="owner"><a name="spark" class="extype" href="../package.html">spark</a>.<a name="spark.rdd" class="extype" href="package.html">rdd</a></p>
+ <h1>UnionRDD</h1>
+ </div>
+
+ <h4 class="signature" id="signature">
+ <span class="modifier_kind">
+ <span class="modifier"></span>
+ <span class="kind">class</span>
+ </span>
+ <span class="symbol">
+ <span class="name">UnionRDD</span><span class="tparams">[<span name="T">T</span>]</span><span class="result"> extends <a name="spark.RDD" class="extype" href="../RDD.html">RDD</a>[T] with <span name="scala.Serializable" class="extype">Serializable</span></span>
+ </span>
+ </h4>
+
+ <div class="fullcommenttop" id="comment"><div class="toggleContainer block">
+ <span class="toggle">Linear Supertypes</span>
+ <div class="superTypes hiddenContent"><a name="spark.RDD" class="extype" href="../RDD.html">RDD</a>[T], <span name="scala.Serializable" class="extype">Serializable</span>, <span name="java.io.Serializable" class="extype">Serializable</span>, AnyRef, <span name="scala.Any" class="extype">Any</span></div>
+ </div></div>
+
+
+ <div id="mbrsel">
+ <div id="textfilter"><span class="pre"></span><span class="input"><input accesskey="/" type="text" /></span><span class="post"></span></div>
+ <div id="order">
+ <span class="filtertype">Ordering</span>
+ <ol><li class="alpha in"><span>Alphabetic</span></li><li class="inherit out"><span>By inheritance</span></li></ol>
+ </div>
+ <div id="ancestors">
+ <span class="filtertype">Inherited</span>
+ <ol><li class="hideall out"><span>Hide All</span></li>
+ <li class="showall in"><span>Show all</span></li></ol>
+ <ol id="linearization"><li name="spark.rdd.UnionRDD" class="in"><span>UnionRDD</span></li><li name="spark.RDD" class="in"><span>RDD</span></li><li name="scala.Serializable" class="in"><span>Serializable</span></li><li name="java.io.Serializable" class="in"><span>Serializable</span></li><li name="scala.AnyRef" class="in"><span>AnyRef</span></li><li name="scala.Any" class="in"><span>Any</span></li></ol>
+ </div>
+ <div id="visbl">
+ <span class="filtertype">Visibility</span>
+ <ol><li class="public in"><span>Public</span></li><li class="all out"><span>All</span></li></ol>
+ </div>
+ </div>
+
+ <div id="template">
+ <div id="allMembers">
+ <div class="members" id="constructors">
+ <h3>Instance Constructors</h3>
+ <ol><li visbl="pub" name="spark.rdd.UnionRDD#this" data-isabs="false">
+ <a id="this:UnionRDD[T]"></a>
+ <h4 class="signature">
+ <span class="modifier_kind">
+ <span class="modifier"></span>
+ <span class="kind">new</span>
+ </span>
+ <span class="symbol">
+ <span class="name">UnionRDD</span><span class="params">(<span name="sc">sc: <a name="spark.SparkContext" class="extype" href="../SparkContext.html">SparkContext</a></span>, <span name="rdds">rdds: Seq[<a name="spark.RDD" class="extype" href="../RDD.html">RDD</a>[T]]</span>)</span><span class="params">(<span class="implicit">implicit </span><span name="arg0">arg0: ClassManifest[T]</span>)</span>
+ </span>
+ </h4>
+
+ </li></ol>
+ </div>
+
+
+
+
+
+ <div class="values members" id="values">
+ <h3>Value Members</h3>
+ <ol><li visbl="pub" name="scala.AnyRef#!=" data-isabs="false">
+ <a id="!=(AnyRef):Boolean"></a>
+ <h4 class="signature">
+ <span class="modifier_kind">
+ <span class="modifier">final </span>
+ <span class="kind">def</span>
+ </span>
+ <span class="symbol">
+ <span class="name" title="gt4s: $bang$eq">!=</span><span class="params">(<span name="arg0">arg0: AnyRef</span>)</span><span class="result">: <span name="scala.Boolean" class="extype">Boolean</span></span>
+ </span>
+ </h4>
+ <div class="fullcomment"><dl class="attributes block"> <dt>Definition Classes</dt><dd>AnyRef</dd></dl></div>
+ </li><li visbl="pub" name="scala.Any#!=" data-isabs="false">
+ <a id="!=(Any):Boolean"></a>
+ <h4 class="signature">
+ <span class="modifier_kind">
+ <span class="modifier">final </span>
+ <span class="kind">def</span>
+ </span>
+ <span class="symbol">
+ <span class="name" title="gt4s: $bang$eq">!=</span><span class="params">(<span name="arg0">arg0: <span name="scala.Any" class="extype">Any</span></span>)</span><span class="result">: <span name="scala.Boolean" class="extype">Boolean</span></span>
+ </span>
+ </h4>
+ <div class="fullcomment"><dl class="attributes block"> <dt>Definition Classes</dt><dd>Any</dd></dl></div>
+ </li><li visbl="pub" name="scala.AnyRef###" data-isabs="false">
+ <a id="##():Int"></a>
+ <h4 class="signature">
+ <span class="modifier_kind">
+ <span class="modifier">final </span>
+ <span class="kind">def</span>
+ </span>
+ <span class="symbol">
+ <span class="name" title="gt4s: $hash$hash">##</span><span class="params">()</span><span class="result">: <span name="scala.Int" class="extype">Int</span></span>
+ </span>
+ </h4>
+ <div class="fullcomment"><dl class="attributes block"> <dt>Definition Classes</dt><dd>AnyRef → Any</dd></dl></div>
+ </li><li visbl="pub" name="spark.RDD#++" data-isabs="false">
+ <a id="++(RDD[T]):RDD[T]"></a>
+ <h4 class="signature">
+ <span class="modifier_kind">
+ <span class="modifier"></span>
+ <span class="kind">def</span>
+ </span>
+ <span class="symbol">
+ <span class="name" title="gt4s: $plus$plus">++</span><span class="params">(<span name="other">other: <a name="spark.RDD" class="extype" href="../RDD.html">RDD</a>[T]</span>)</span><span class="result">: <a name="spark.RDD" class="extype" href="../RDD.html">RDD</a>[T]</span>
+ </span>
+ </h4>
+ <p class="shortcomment cmt">Return the union of this RDD and another one.</p><div class="fullcomment"><div class="comment cmt"><p>Return the union of this RDD and another one. Any identical elements will appear multiple
+times (use <code>.distinct()</code> to eliminate them).
+</p></div><dl class="attributes block"> <dt>Definition Classes</dt><dd><a name="spark.RDD" class="extype" href="../RDD.html">RDD</a></dd></dl></div>
+ </li><li visbl="pub" name="scala.AnyRef#==" data-isabs="false">
+ <a id="==(AnyRef):Boolean"></a>
+ <h4 class="signature">
+ <span class="modifier_kind">
+ <span class="modifier">final </span>
+ <span class="kind">def</span>
+ </span>
+ <span class="symbol">
+ <span class="name" title="gt4s: $eq$eq">==</span><span class="params">(<span name="arg0">arg0: AnyRef</span>)</span><span class="result">: <span name="scala.Boolean" class="extype">Boolean</span></span>
+ </span>
+ </h4>
+ <div class="fullcomment"><dl class="attributes block"> <dt>Definition Classes</dt><dd>AnyRef</dd></dl></div>
+ </li><li visbl="pub" name="scala.Any#==" data-isabs="false">
+ <a id="==(Any):Boolean"></a>
+ <h4 class="signature">
+ <span class="modifier_kind">
+ <span class="modifier">final </span>
+ <span class="kind">def</span>
+ </span>
+ <span class="symbol">
+ <span class="name" title="gt4s: $eq$eq">==</span><span class="params">(<span name="arg0">arg0: <span name="scala.Any" class="extype">Any</span></span>)</span><span class="result">: <span name="scala.Boolean" class="extype">Boolean</span></span>
+ </span>
+ </h4>
+ <div class="fullcomment"><dl class="attributes block"> <dt>Definition Classes</dt><dd>Any</dd></dl></div>
+ </li><li visbl="pub" name="spark.RDD#aggregate" data-isabs="false">
+ <a id="aggregate[U](U)((U, T) ⇒ U,(U, U) ⇒ U)(ClassManifest[U]):U"></a>
+ <h4 class="signature">
+ <span class="modifier_kind">
+ <span class="modifier"></span>
+ <span class="kind">def</span>
+ </span>
+ <span class="symbol">
+ <span class="name">aggregate</span><span class="tparams">[<span name="U">U</span>]</span><span class="params">(<span name="zeroValue">zeroValue: U</span>)</span><span class="params">(<span name="seqOp">seqOp: (U, T) ⇒ U</span>, <span name="combOp">combOp: (U, U) ⇒ U</span>)</span><span class="params">(<span class="implicit">implicit </span><span name="arg0">arg0: ClassManifest[U]</span>)</span><span class="result">: U</span>
+ </span>
+ </h4>
+ <p class="shortcomment cmt">Aggregate the elements of each partition, and then the results for all the partitions, using
+given combine functions and a neutral &quot;zero value&quot;.</p><div class="fullcomment"><div class="comment cmt"><p>Aggregate the elements of each partition, and then the results for all the partitions, using
+given combine functions and a neutral &quot;zero value&quot;. This function can return a different result
+type, U, than the type of this RDD, T. Thus, we need one operation for merging a T into a U
+and one operation for merging two U's, as in scala.TraversableOnce. Both of these functions are
+allowed to modify and return their first argument instead of creating a new U to avoid memory
+allocation.
+</p></div><dl class="attributes block"> <dt>Definition Classes</dt><dd><a name="spark.RDD" class="extype" href="../RDD.html">RDD</a></dd></dl></div>
+ </li><li visbl="pub" name="scala.Any#asInstanceOf" data-isabs="false">
+ <a id="asInstanceOf[T0]:T0"></a>
+ <h4 class="signature">
+ <span class="modifier_kind">
+ <span class="modifier">final </span>
+ <span class="kind">def</span>
+ </span>
+ <span class="symbol">
+ <span class="name">asInstanceOf</span><span class="tparams">[<span name="T0">T0</span>]</span><span class="result">: T0</span>
+ </span>
+ </h4>
+ <div class="fullcomment"><dl class="attributes block"> <dt>Definition Classes</dt><dd>Any</dd></dl></div>
+ </li><li visbl="pub" name="spark.RDD#cache" data-isabs="false">
+ <a id="cache():RDD[T]"></a>
+ <h4 class="signature">
+ <span class="modifier_kind">
+ <span class="modifier"></span>
+ <span class="kind">def</span>
+ </span>
+ <span class="symbol">
+ <span class="name">cache</span><span class="params">()</span><span class="result">: <a name="spark.RDD" class="extype" href="../RDD.html">RDD</a>[T]</span>
+ </span>
+ </h4>
+ <p class="shortcomment cmt">Persist this RDD with the default storage level (<code>MEMORY_ONLY</code>).</p><div class="fullcomment"><div class="comment cmt"><p>Persist this RDD with the default storage level (<code>MEMORY_ONLY</code>).</p></div><dl class="attributes block"> <dt>Definition Classes</dt><dd><a name="spark.RDD" class="extype" href="../RDD.html">RDD</a></dd></dl></div>
+ </li><li visbl="pub" name="spark.RDD#cartesian" data-isabs="false">
+ <a id="cartesian[U](RDD[U])(ClassManifest[U]):RDD[(T, U)]"></a>
+ <h4 class="signature">
+ <span class="modifier_kind">
+ <span class="modifier"></span>
+ <span class="kind">def</span>
+ </span>
+ <span class="symbol">
+ <span class="name">cartesian</span><span class="tparams">[<span name="U">U</span>]</span><span class="params">(<span name="other">other: <a name="spark.RDD" class="extype" href="../RDD.html">RDD</a>[U]</span>)</span><span class="params">(<span class="implicit">implicit </span><span name="arg0">arg0: ClassManifest[U]</span>)</span><span class="result">: <a name="spark.RDD" class="extype" href="../RDD.html">RDD</a>[(T, U)]</span>
+ </span>
+ </h4>
+ <p class="shortcomment cmt">Return the Cartesian product of this RDD and another one, that is, the RDD of all pairs of
+elements (a, b) where a is in <code>this</code> and b is in <code>other</code>.</p><div class="fullcomment"><div class="comment cmt"><p>Return the Cartesian product of this RDD and another one, that is, the RDD of all pairs of
+elements (a, b) where a is in <code>this</code> and b is in <code>other</code>.
+</p></div><dl class="attributes block"> <dt>Definition Classes</dt><dd><a name="spark.RDD" class="extype" href="../RDD.html">RDD</a></dd></dl></div>
+ </li><li visbl="prt" name="scala.AnyRef#clone" data-isabs="false">
+ <a id="clone():AnyRef"></a>
+ <h4 class="signature">
+ <span class="modifier_kind">
+ <span class="modifier"></span>
+ <span class="kind">def</span>
+ </span>
+ <span class="symbol">
+ <span class="name">clone</span><span class="params">()</span><span class="result">: AnyRef</span>
+ </span>
+ </h4>
+ <div class="fullcomment"><dl class="attributes block"> <dt>Attributes</dt><dd>protected[<a name="java.lang" class="extype" href="../../java/lang/package.html">lang</a>] </dd><dt>Definition Classes</dt><dd>AnyRef</dd><dt>Annotations</dt><dd>
+ <span class="name">@throws</span><span class="args">()</span>
+
+ </dd></dl></div>
+ </li><li visbl="pub" name="spark.RDD#collect" data-isabs="false">
+ <a id="collect():Array[T]"></a>
+ <h4 class="signature">
+ <span class="modifier_kind">
+ <span class="modifier"></span>
+ <span class="kind">def</span>
+ </span>
+ <span class="symbol">
+ <span class="name">collect</span><span class="params">()</span><span class="result">: <span name="scala.Array" class="extype">Array</span>[T]</span>
+ </span>
+ </h4>
+ <p class="shortcomment cmt">Return an array that contains all of the elements in this RDD.</p><div class="fullcomment"><div class="comment cmt"><p>Return an array that contains all of the elements in this RDD.
+</p></div><dl class="attributes block"> <dt>Definition Classes</dt><dd><a name="spark.RDD" class="extype" href="../RDD.html">RDD</a></dd></dl></div>
+ </li><li visbl="pub" name="spark.rdd.UnionRDD#compute" data-isabs="false">
+ <a id="compute(Split):Iterator[T]"></a>
+ <h4 class="signature">
+ <span class="modifier_kind">
+ <span class="modifier"></span>
+ <span class="kind">def</span>
+ </span>
+ <span class="symbol">
+ <span class="name">compute</span><span class="params">(<span name="s">s: <a name="spark.Split" class="extype" href="../Split.html">Split</a></span>)</span><span class="result">: Iterator[T]</span>
+ </span>
+ </h4>
+ <p class="shortcomment cmt">Function for computing a given partition.</p><div class="fullcomment"><div class="comment cmt"><p>Function for computing a given partition.</p></div><dl class="attributes block"> <dt>Definition Classes</dt><dd><a name="spark.rdd.UnionRDD" class="extype" href="">UnionRDD</a> → <a name="spark.RDD" class="extype" href="../RDD.html">RDD</a></dd></dl></div>
+ </li><li visbl="pub" name="spark.RDD#context" data-isabs="false">
+ <a id="context:SparkContext"></a>
+ <h4 class="signature">
+ <span class="modifier_kind">
+ <span class="modifier"></span>
+ <span class="kind">def</span>
+ </span>
+ <span class="symbol">
+ <span class="name">context</span><span class="result">: <a name="spark.SparkContext" class="extype" href="../SparkContext.html">SparkContext</a></span>
+ </span>
+ </h4>
+ <p class="shortcomment cmt">The <a name="spark.SparkContext" class="extype" href="../SparkContext.html">SparkContext</a> that this RDD was created on.</p><div class="fullcomment"><div class="comment cmt"><p>The <a name="spark.SparkContext" class="extype" href="../SparkContext.html">SparkContext</a> that this RDD was created on.</p></div><dl class="attributes block"> <dt>Definition Classes</dt><dd><a name="spark.RDD" class="extype" href="../RDD.html">RDD</a></dd></dl></div>
+ </li><li visbl="pub" name="spark.RDD#count" data-isabs="false">
+ <a id="count():Long"></a>
+ <h4 class="signature">
+ <span class="modifier_kind">
+ <span class="modifier"></span>
+ <span class="kind">def</span>
+ </span>
+ <span class="symbol">
+ <span class="name">count</span><span class="params">()</span><span class="result">: <span name="scala.Long" class="extype">Long</span></span>
+ </span>
+ </h4>
+ <p class="shortcomment cmt">Return the number of elements in the RDD.</p><div class="fullcomment"><div class="comment cmt"><p>Return the number of elements in the RDD.
+</p></div><dl class="attributes block"> <dt>Definition Classes</dt><dd><a name="spark.RDD" class="extype" href="../RDD.html">RDD</a></dd></dl></div>
+ </li><li visbl="pub" name="spark.RDD#countApprox" data-isabs="false">
+ <a id="countApprox(Long,Double):PartialResult[BoundedDouble]"></a>
+ <h4 class="signature">
+ <span class="modifier_kind">
+ <span class="modifier"></span>
+ <span class="kind">def</span>
+ </span>
+ <span class="symbol">
+ <span class="name">countApprox</span><span class="params">(<span name="timeout">timeout: <span name="scala.Long" class="extype">Long</span></span>, <span name="confidence">confidence: <span name="scala.Double" class="extype">Double</span> = <span class="symbol">0.95</span></span>)</span><span class="result">: <a name="spark.partial.PartialResult" class="extype" href="../partial/PartialResult.html">PartialResult</a>[<a name="spark.partial.BoundedDouble" class="extype" href="../partial/BoundedDouble.html">BoundedDouble</a>]</span>
+ </span>
+ </h4>
+ <p class="shortcomment cmt">(Experimental) Approximate version of count() that returns a potentially incomplete result
+within a timeout, even if not all tasks have finished.</p><div class="fullcomment"><div class="comment cmt"><p>(Experimental) Approximate version of count() that returns a potentially incomplete result
+within a timeout, even if not all tasks have finished.
+</p></div><dl class="attributes block"> <dt>Definition Classes</dt><dd><a name="spark.RDD" class="extype" href="../RDD.html">RDD</a></dd></dl></div>
+ </li><li visbl="pub" name="spark.RDD#countByValue" data-isabs="false">
+ <a id="countByValue():Map[T, Long]"></a>
+ <h4 class="signature">
+ <span class="modifier_kind">
+ <span class="modifier"></span>
+ <span class="kind">def</span>
+ </span>
+ <span class="symbol">
+ <span class="name">countByValue</span><span class="params">()</span><span class="result">: <span name="scala.collection.Map" class="extype">Map</span>[T, <span name="scala.Long" class="extype">Long</span>]</span>
+ </span>
+ </h4>
+ <p class="shortcomment cmt">Return the count of each unique value in this RDD as a map of (value, count) pairs.</p><div class="fullcomment"><div class="comment cmt"><p>Return the count of each unique value in this RDD as a map of (value, count) pairs. The final
+combine step happens locally on the master, equivalent to running a single reduce task.
+</p></div><dl class="attributes block"> <dt>Definition Classes</dt><dd><a name="spark.RDD" class="extype" href="../RDD.html">RDD</a></dd></dl></div>
+ </li><li visbl="pub" name="spark.RDD#countByValueApprox" data-isabs="false">
+ <a id="countByValueApprox(Long,Double):PartialResult[Map[T, BoundedDouble]]"></a>
+ <h4 class="signature">
+ <span class="modifier_kind">
+ <span class="modifier"></span>
+ <span class="kind">def</span>
+ </span>
+ <span class="symbol">
+ <span class="name">countByValueApprox</span><span class="params">(<span name="timeout">timeout: <span name="scala.Long" class="extype">Long</span></span>, <span name="confidence">confidence: <span name="scala.Double" class="extype">Double</span> = <span class="symbol">0.95</span></span>)</span><span class="result">: <a name="spark.partial.PartialResult" class="extype" href="../partial/PartialResult.html">PartialResult</a>[<span name="scala.collection.Map" class="extype">Map</span>[T, <a name="spark.partial.BoundedDouble" class="extype" href="../partial/BoundedDouble.html">BoundedDouble</a>]]</span>
+ </span>
+ </h4>
+ <p class="shortcomment cmt">(Experimental) Approximate version of countByValue().</p><div class="fullcomment"><div class="comment cmt"><p>(Experimental) Approximate version of countByValue().
+</p></div><dl class="attributes block"> <dt>Definition Classes</dt><dd><a name="spark.RDD" class="extype" href="../RDD.html">RDD</a></dd></dl></div>
+ </li><li visbl="pub" name="spark.rdd.UnionRDD#dependencies" data-isabs="false">
+ <a id="dependencies:List[spark.Dependency[_]]"></a>
+ <h4 class="signature">
+ <span class="modifier_kind">
+ <span class="modifier"></span>
+ <span class="kind">val</span>
+ </span>
+ <span class="symbol">
+ <span class="name">dependencies</span><span class="result">: <span name="scala.collection.immutable.List" class="extype">List</span>[spark.Dependency[_]]</span>
+ </span>
+ </h4>
+ <p class="shortcomment cmt">How this RDD depends on any parent RDDs.</p><div class="fullcomment"><div class="comment cmt"><p>How this RDD depends on any parent RDDs.</p></div><dl class="attributes block"> <dt>Definition Classes</dt><dd><a name="spark.rdd.UnionRDD" class="extype" href="">UnionRDD</a> → <a name="spark.RDD" class="extype" href="../RDD.html">RDD</a></dd></dl></div>
+ </li><li visbl="pub" name="spark.RDD#distinct" data-isabs="false">
+ <a id="distinct(Int):RDD[T]"></a>
+ <h4 class="signature">
+ <span class="modifier_kind">
+ <span class="modifier"></span>
+ <span class="kind">def</span>
+ </span>
+ <span class="symbol">
+ <span class="name">distinct</span><span class="params">(<span name="numSplits">numSplits: <span name="scala.Int" class="extype">Int</span> = <span class="symbol"><span class="name"><a href="../RDD.html#splits:Array[Split]">splits.size</a></span></span></span>)</span><span class="result">: <a name="spark.RDD" class="extype" href="../RDD.html">RDD</a>[T]</span>
+ </span>
+ </h4>
+ <p class="shortcomment cmt">Return a new RDD containing the distinct elements in this RDD.</p><div class="fullcomment"><div class="comment cmt"><p>Return a new RDD containing the distinct elements in this RDD.
+</p></div><dl class="attributes block"> <dt>Definition Classes</dt><dd><a name="spark.RDD" class="extype" href="../RDD.html">RDD</a></dd></dl></div>
+ </li><li visbl="pub" name="scala.AnyRef#eq" data-isabs="false">
+ <a id="eq(AnyRef):Boolean"></a>
+ <h4 class="signature">
+ <span class="modifier_kind">
+ <span class="modifier">final </span>
+ <span class="kind">def</span>
+ </span>
+ <span class="symbol">
+ <span class="name">eq</span><span class="params">(<span name="arg0">arg0: AnyRef</span>)</span><span class="result">: <span name="scala.Boolean" class="extype">Boolean</span></span>
+ </span>
+ </h4>
+ <div class="fullcomment"><dl class="attributes block"> <dt>Definition Classes</dt><dd>AnyRef</dd></dl></div>
+ </li><li visbl="pub" name="scala.AnyRef#equals" data-isabs="false">
+ <a id="equals(Any):Boolean"></a>
+ <h4 class="signature">
+ <span class="modifier_kind">
+ <span class="modifier"></span>
+ <span class="kind">def</span>
+ </span>
+ <span class="symbol">
+ <span class="name">equals</span><span class="params">(<span name="arg0">arg0: <span name="scala.Any" class="extype">Any</span></span>)</span><span class="result">: <span name="scala.Boolean" class="extype">Boolean</span></span>
+ </span>
+ </h4>
+ <div class="fullcomment"><dl class="attributes block"> <dt>Definition Classes</dt><dd>AnyRef → Any</dd></dl></div>
+ </li><li visbl="pub" name="spark.RDD#filter" data-isabs="false">
+ <a id="filter((T) ⇒ Boolean):RDD[T]"></a>
+ <h4 class="signature">
+ <span class="modifier_kind">
+ <span class="modifier"></span>
+ <span class="kind">def</span>
+ </span>
+ <span class="symbol">
+ <span class="name">filter</span><span class="params">(<span name="f">f: (T) ⇒ <span name="scala.Boolean" class="extype">Boolean</span></span>)</span><span class="result">: <a name="spark.RDD" class="extype" href="../RDD.html">RDD</a>[T]</span>
+ </span>
+ </h4>
+ <p class="shortcomment cmt">Return a new RDD containing only the elements that satisfy a predicate.</p><div class="fullcomment"><div class="comment cmt"><p>Return a new RDD containing only the elements that satisfy a predicate.
+</p></div><dl class="attributes block"> <dt>Definition Classes</dt><dd><a name="spark.RDD" class="extype" href="../RDD.html">RDD</a></dd></dl></div>
+ </li><li visbl="prt" name="scala.AnyRef#finalize" data-isabs="false">
+ <a id="finalize():Unit"></a>
+ <h4 class="signature">
+ <span class="modifier_kind">
+ <span class="modifier"></span>
+ <span class="kind">def</span>
+ </span>
+ <span class="symbol">
+ <span class="name">finalize</span><span class="params">()</span><span class="result">: <span name="scala.Unit" class="extype">Unit</span></span>
+ </span>
+ </h4>
+ <div class="fullcomment"><dl class="attributes block"> <dt>Attributes</dt><dd>protected[<a name="java.lang" class="extype" href="../../java/lang/package.html">lang</a>] </dd><dt>Definition Classes</dt><dd>AnyRef</dd><dt>Annotations</dt><dd>
+ <span class="name">@throws</span><span class="args">()</span>
+
+ </dd></dl></div>
+ </li><li visbl="pub" name="spark.RDD#first" data-isabs="false">
+ <a id="first():T"></a>
+ <h4 class="signature">
+ <span class="modifier_kind">
+ <span class="modifier"></span>
+ <span class="kind">def</span>
+ </span>
+ <span class="symbol">
+ <span class="name">first</span><span class="params">()</span><span class="result">: T</span>
+ </span>
+ </h4>
+ <p class="shortcomment cmt">Return the first element in this RDD.</p><div class="fullcomment"><div class="comment cmt"><p>Return the first element in this RDD.
+</p></div><dl class="attributes block"> <dt>Definition Classes</dt><dd><a name="spark.RDD" class="extype" href="../RDD.html">RDD</a></dd></dl></div>
+ </li><li visbl="pub" name="spark.RDD#flatMap" data-isabs="false">
+ <a id="flatMap[U]((T) ⇒ TraversableOnce[U])(ClassManifest[U]):RDD[U]"></a>
+ <h4 class="signature">
+ <span class="modifier_kind">
+ <span class="modifier"></span>
+ <span class="kind">def</span>
+ </span>
+ <span class="symbol">
+ <span class="name">flatMap</span><span class="tparams">[<span name="U">U</span>]</span><span class="params">(<span name="f">f: (T) ⇒ TraversableOnce[U]</span>)</span><span class="params">(<span class="implicit">implicit </span><span name="arg0">arg0: ClassManifest[U]</span>)</span><span class="result">: <a name="spark.RDD" class="extype" href="../RDD.html">RDD</a>[U]</span>
+ </span>
+ </h4>
+ <p class="shortcomment cmt"> Return a new RDD by first applying a function to all elements of this
+ RDD, and then flattening the results.</p><div class="fullcomment"><div class="comment cmt"><p> Return a new RDD by first applying a function to all elements of this
+ RDD, and then flattening the results.
+</p></div><dl class="attributes block"> <dt>Definition Classes</dt><dd><a name="spark.RDD" class="extype" href="../RDD.html">RDD</a></dd></dl></div>
+ </li><li visbl="pub" name="spark.RDD#fold" data-isabs="false">
+ <a id="fold(T)((T, T) ⇒ T):T"></a>
+ <h4 class="signature">
+ <span class="modifier_kind">
+ <span class="modifier"></span>
+ <span class="kind">def</span>
+ </span>
+ <span class="symbol">
+ <span class="name">fold</span><span class="params">(<span name="zeroValue">zeroValue: T</span>)</span><span class="params">(<span name="op">op: (T, T) ⇒ T</span>)</span><span class="result">: T</span>
+ </span>
+ </h4>
+ <p class="shortcomment cmt">Aggregate the elements of each partition, and then the results for all the partitions, using a
+given associative function and a neutral &quot;zero value&quot;.</p><div class="fullcomment"><div class="comment cmt"><p>Aggregate the elements of each partition, and then the results for all the partitions, using a
+given associative function and a neutral &quot;zero value&quot;. The function op(t1, t2) is allowed to
+modify t1 and return it as its result value to avoid object allocation; however, it should not
+modify t2.
+</p></div><dl class="attributes block"> <dt>Definition Classes</dt><dd><a name="spark.RDD" class="extype" href="../RDD.html">RDD</a></dd></dl></div>
+ </li><li visbl="pub" name="spark.RDD#foreach" data-isabs="false">
+ <a id="foreach((T) ⇒ Unit):Unit"></a>
+ <h4 class="signature">
+ <span class="modifier_kind">
+ <span class="modifier"></span>
+ <span class="kind">def</span>
+ </span>
+ <span class="symbol">
+ <span class="name">foreach</span><span class="params">(<span name="f">f: (T) ⇒ <span name="scala.Unit" class="extype">Unit</span></span>)</span><span class="result">: <span name="scala.Unit" class="extype">Unit</span></span>
+ </span>
+ </h4>
+ <p class="shortcomment cmt">Applies a function f to all elements of this RDD.</p><div class="fullcomment"><div class="comment cmt"><p>Applies a function f to all elements of this RDD.
+</p></div><dl class="attributes block"> <dt>Definition Classes</dt><dd><a name="spark.RDD" class="extype" href="../RDD.html">RDD</a></dd></dl></div>
+ </li><li visbl="pub" name="scala.AnyRef#getClass" data-isabs="false">
+ <a id="getClass():java.lang.Class[_]"></a>
+ <h4 class="signature">
+ <span class="modifier_kind">
+ <span class="modifier">final </span>
+ <span class="kind">def</span>
+ </span>
+ <span class="symbol">
+ <span class="name">getClass</span><span class="params">()</span><span class="result">: java.lang.Class[_]</span>
+ </span>
+ </h4>
+ <div class="fullcomment"><dl class="attributes block"> <dt>Definition Classes</dt><dd>AnyRef → Any</dd></dl></div>
+ </li><li visbl="pub" name="spark.RDD#getStorageLevel" data-isabs="false">
+ <a id="getStorageLevel:StorageLevel"></a>
+ <h4 class="signature">
+ <span class="modifier_kind">
+ <span class="modifier"></span>
+ <span class="kind">def</span>
+ </span>
+ <span class="symbol">
+ <span class="name">getStorageLevel</span><span class="result">: <a name="spark.storage.StorageLevel" class="extype" href="../storage/StorageLevel.html">StorageLevel</a></span>
+ </span>
+ </h4>
+ <p class="shortcomment cmt">Get the RDD's current storage level, or StorageLevel.NONE if none is set.</p><div class="fullcomment"><div class="comment cmt"><p>Get the RDD's current storage level, or StorageLevel.NONE if none is set.</p></div><dl class="attributes block"> <dt>Definition Classes</dt><dd><a name="spark.RDD" class="extype" href="../RDD.html">RDD</a></dd></dl></div>
+ </li><li visbl="pub" name="spark.RDD#glom" data-isabs="false">
+ <a id="glom():RDD[Array[T]]"></a>
+ <h4 class="signature">
+ <span class="modifier_kind">
+ <span class="modifier"></span>
+ <span class="kind">def</span>
+ </span>
+ <span class="symbol">
+ <span class="name">glom</span><span class="params">()</span><span class="result">: <a name="spark.RDD" class="extype" href="../RDD.html">RDD</a>[<span name="scala.Array" class="extype">Array</span>[T]]</span>
+ </span>
+ </h4>
+ <p class="shortcomment cmt">Return an RDD created by coalescing all elements within each partition into an array.</p><div class="fullcomment"><div class="comment cmt"><p>Return an RDD created by coalescing all elements within each partition into an array.
+</p></div><dl class="attributes block"> <dt>Definition Classes</dt><dd><a name="spark.RDD" class="extype" href="../RDD.html">RDD</a></dd></dl></div>
+ </li><li visbl="pub" name="spark.RDD#groupBy" data-isabs="false">
+ <a id="groupBy[K]((T) ⇒ K)(ClassManifest[K]):RDD[(K, Seq[T])]"></a>
+ <h4 class="signature">
+ <span class="modifier_kind">
+ <span class="modifier"></span>
+ <span class="kind">def</span>
+ </span>
+ <span class="symbol">
+ <span class="name">groupBy</span><span class="tparams">[<span name="K">K</span>]</span><span class="params">(<span name="f">f: (T) ⇒ K</span>)</span><span class="params">(<span class="implicit">implicit </span><span name="arg0">arg0: ClassManifest[K]</span>)</span><span class="result">: <a name="spark.RDD" class="extype" href="../RDD.html">RDD</a>[(K, Seq[T])]</span>
+ </span>
+ </h4>
+ <p class="shortcomment cmt">Return an RDD of grouped items.</p><div class="fullcomment"><div class="comment cmt"><p>Return an RDD of grouped items.
+</p></div><dl class="attributes block"> <dt>Definition Classes</dt><dd><a name="spark.RDD" class="extype" href="../RDD.html">RDD</a></dd></dl></div>
+ </li><li visbl="pub" name="spark.RDD#groupBy" data-isabs="false">
+ <a id="groupBy[K]((T) ⇒ K,Int)(ClassManifest[K]):RDD[(K, Seq[T])]"></a>
+ <h4 class="signature">
+ <span class="modifier_kind">
+ <span class="modifier"></span>
+ <span class="kind">def</span>
+ </span>
+ <span class="symbol">
+ <span class="name">groupBy</span><span class="tparams">[<span name="K">K</span>]</span><span class="params">(<span name="f">f: (T) ⇒ K</span>, <span name="numSplits">numSplits: <span name="scala.Int" class="extype">Int</span></span>)</span><span class="params">(<span class="implicit">implicit </span><span name="arg0">arg0: ClassManifest[K]</span>)</span><span class="result">: <a name="spark.RDD" class="extype" href="../RDD.html">RDD</a>[(K, Seq[T])]</span>
+ </span>
+ </h4>
+ <p class="shortcomment cmt">Return an RDD of grouped elements.</p><div class="fullcomment"><div class="comment cmt"><p>Return an RDD of grouped elements. Each group consists of a key and a sequence of elements
+mapping to that key.
+</p></div><dl class="attributes block"> <dt>Definition Classes</dt><dd><a name="spark.RDD" class="extype" href="../RDD.html">RDD</a></dd></dl></div>
+ </li><li visbl="pub" name="scala.AnyRef#hashCode" data-isabs="false">
+ <a id="hashCode():Int"></a>
+ <h4 class="signature">
+ <span class="modifier_kind">
+ <span class="modifier"></span>
+ <span class="kind">def</span>
+ </span>
+ <span class="symbol">
+ <span class="name">hashCode</span><span class="params">()</span><span class="result">: <span name="scala.Int" class="extype">Int</span></span>
+ </span>
+ </h4>
+ <div class="fullcomment"><dl class="attributes block"> <dt>Definition Classes</dt><dd>AnyRef → Any</dd></dl></div>
+ </li><li visbl="pub" name="spark.RDD#id" data-isabs="false">
+ <a id="id:Int"></a>
+ <h4 class="signature">
+ <span class="modifier_kind">
+ <span class="modifier"></span>
+ <span class="kind">val</span>
+ </span>
+ <span class="symbol">
+ <span class="name">id</span><span class="result">: <span name="scala.Int" class="extype">Int</span></span>
+ </span>
+ </h4>
+ <p class="shortcomment cmt">A unique ID for this RDD (within its SparkContext).</p><div class="fullcomment"><div class="comment cmt"><p>A unique ID for this RDD (within its SparkContext).</p></div><dl class="attributes block"> <dt>Definition Classes</dt><dd><a name="spark.RDD" class="extype" href="../RDD.html">RDD</a></dd></dl></div>
+ </li><li visbl="pub" name="scala.Any#isInstanceOf" data-isabs="false">
+ <a id="isInstanceOf[T0]:Boolean"></a>
+ <h4 class="signature">
+ <span class="modifier_kind">
+ <span class="modifier">final </span>
+ <span class="kind">def</span>
+ </span>
+ <span class="symbol">
+ <span class="name">isInstanceOf</span><span class="tparams">[<span name="T0">T0</span>]</span><span class="result">: <span name="scala.Boolean" class="extype">Boolean</span></span>
+ </span>
+ </h4>
+ <div class="fullcomment"><dl class="attributes block"> <dt>Definition Classes</dt><dd>Any</dd></dl></div>
+ </li><li visbl="pub" name="spark.RDD#iterator" data-isabs="false">
+ <a id="iterator(Split):Iterator[T]"></a>
+ <h4 class="signature">
+ <span class="modifier_kind">
+ <span class="modifier">final </span>
+ <span class="kind">def</span>
+ </span>
+ <span class="symbol">
+ <span class="name">iterator</span><span class="params">(<span name="split">split: <a name="spark.Split" class="extype" href="../Split.html">Split</a></span>)</span><span class="result">: Iterator[T]</span>
+ </span>
+ </h4>
+ <p class="shortcomment cmt">Internal method to this RDD; will read from cache if applicable, or otherwise compute it.</p><div class="fullcomment"><div class="comment cmt"><p>Internal method to this RDD; will read from cache if applicable, or otherwise compute it.
+This should <i>not</i> be called by users directly, but is available for implementors of custom
+subclasses of RDD.
+</p></div><dl class="attributes block"> <dt>Definition Classes</dt><dd><a name="spark.RDD" class="extype" href="../RDD.html">RDD</a></dd></dl></div>
+ </li><li visbl="pub" name="spark.RDD#map" data-isabs="false">
+ <a id="map[U]((T) ⇒ U)(ClassManifest[U]):RDD[U]"></a>
+ <h4 class="signature">
+ <span class="modifier_kind">
+ <span class="modifier"></span>
+ <span class="kind">def</span>
+ </span>
+ <span class="symbol">
+ <span class="name">map</span><span class="tparams">[<span name="U">U</span>]</span><span class="params">(<span name="f">f: (T) ⇒ U</span>)</span><span class="params">(<span class="implicit">implicit </span><span name="arg0">arg0: ClassManifest[U]</span>)</span><span class="result">: <a name="spark.RDD" class="extype" href="../RDD.html">RDD</a>[U]</span>
+ </span>
+ </h4>
+ <p class="shortcomment cmt">Return a new RDD by applying a function to all elements of this RDD.</p><div class="fullcomment"><div class="comment cmt"><p>Return a new RDD by applying a function to all elements of this RDD.
+</p></div><dl class="attributes block"> <dt>Definition Classes</dt><dd><a name="spark.RDD" class="extype" href="../RDD.html">RDD</a></dd></dl></div>
+ </li><li visbl="pub" name="spark.RDD#mapPartitions" data-isabs="false">
+ <a id="mapPartitions[U]((Iterator[T]) ⇒ Iterator[U])(ClassManifest[U]):RDD[U]"></a>
+ <h4 class="signature">
+ <span class="modifier_kind">
+ <span class="modifier"></span>
+ <span class="kind">def</span>
+ </span>
+ <span class="symbol">
+ <span class="name">mapPartitions</span><span class="tparams">[<span name="U">U</span>]</span><span class="params">(<span name="f">f: (Iterator[T]) ⇒ Iterator[U]</span>)</span><span class="params">(<span class="implicit">implicit </span><span name="arg0">arg0: ClassManifest[U]</span>)</span><span class="result">: <a name="spark.RDD" class="extype" href="../RDD.html">RDD</a>[U]</span>
+ </span>
+ </h4>
+ <p class="shortcomment cmt">Return a new RDD by applying a function to each partition of this RDD.</p><div class="fullcomment"><div class="comment cmt"><p>Return a new RDD by applying a function to each partition of this RDD.
+</p></div><dl class="attributes block"> <dt>Definition Classes</dt><dd><a name="spark.RDD" class="extype" href="../RDD.html">RDD</a></dd></dl></div>
+ </li><li visbl="pub" name="spark.RDD#mapPartitionsWithSplit" data-isabs="false">
+ <a id="mapPartitionsWithSplit[U]((Int, Iterator[T]) ⇒ Iterator[U])(ClassManifest[U]):RDD[U]"></a>
+ <h4 class="signature">
+ <span class="modifier_kind">
+ <span class="modifier"></span>
+ <span class="kind">def</span>
+ </span>
+ <span class="symbol">
+ <span class="name">mapPartitionsWithSplit</span><span class="tparams">[<span name="U">U</span>]</span><span class="params">(<span name="f">f: (<span name="scala.Int" class="extype">Int</span>, Iterator[T]) ⇒ Iterator[U]</span>)</span><span class="params">(<span class="implicit">implicit </span><span name="arg0">arg0: ClassManifest[U]</span>)</span><span class="result">: <a name="spark.RDD" class="extype" href="../RDD.html">RDD</a>[U]</span>
+ </span>
+ </h4>
+ <p class="shortcomment cmt">Return a new RDD by applying a function to each partition of this RDD, while tracking the index
+of the original partition.</p><div class="fullcomment"><div class="comment cmt"><p>Return a new RDD by applying a function to each partition of this RDD, while tracking the index
+of the original partition.
+</p></div><dl class="attributes block"> <dt>Definition Classes</dt><dd><a name="spark.RDD" class="extype" href="../RDD.html">RDD</a></dd></dl></div>
+ </li><li visbl="pub" name="scala.AnyRef#ne" data-isabs="false">
+ <a id="ne(AnyRef):Boolean"></a>
+ <h4 class="signature">
+ <span class="modifier_kind">
+ <span class="modifier">final </span>
+ <span class="kind">def</span>
+ </span>
+ <span class="symbol">
+ <span class="name">ne</span><span class="params">(<span name="arg0">arg0: AnyRef</span>)</span><span class="result">: <span name="scala.Boolean" class="extype">Boolean</span></span>
+ </span>
+ </h4>
+ <div class="fullcomment"><dl class="attributes block"> <dt>Definition Classes</dt><dd>AnyRef</dd></dl></div>
+ </li><li visbl="pub" name="scala.AnyRef#notify" data-isabs="false">
+ <a id="notify():Unit"></a>
+ <h4 class="signature">
+ <span class="modifier_kind">
+ <span class="modifier">final </span>
+ <span class="kind">def</span>
+ </span>
+ <span class="symbol">
+ <span class="name">notify</span><span class="params">()</span><span class="result">: <span name="scala.Unit" class="extype">Unit</span></span>
+ </span>
+ </h4>
+ <div class="fullcomment"><dl class="attributes block"> <dt>Definition Classes</dt><dd>AnyRef</dd></dl></div>
+ </li><li visbl="pub" name="scala.AnyRef#notifyAll" data-isabs="false">
+ <a id="notifyAll():Unit"></a>
+ <h4 class="signature">
+ <span class="modifier_kind">
+ <span class="modifier">final </span>
+ <span class="kind">def</span>
+ </span>
+ <span class="symbol">
+ <span class="name">notifyAll</span><span class="params">()</span><span class="result">: <span name="scala.Unit" class="extype">Unit</span></span>
+ </span>
+ </h4>
+ <div class="fullcomment"><dl class="attributes block"> <dt>Definition Classes</dt><dd>AnyRef</dd></dl></div>
+ </li><li visbl="pub" name="spark.RDD#partitioner" data-isabs="false">
+ <a id="partitioner:Option[Partitioner]"></a>
+ <h4 class="signature">
+ <span class="modifier_kind">
+ <span class="modifier"></span>
+ <span class="kind">val</span>
+ </span>
+ <span class="symbol">
+ <span class="name">partitioner</span><span class="result">: <span name="scala.Option" class="extype">Option</span>[<a name="spark.Partitioner" class="extype" href="../Partitioner.html">Partitioner</a>]</span>
+ </span>
+ </h4>
+ <p class="shortcomment cmt">Optionally overridden by subclasses to specify how they are partitioned.</p><div class="fullcomment"><div class="comment cmt"><p>Optionally overridden by subclasses to specify how they are partitioned.</p></div><dl class="attributes block"> <dt>Definition Classes</dt><dd><a name="spark.RDD" class="extype" href="../RDD.html">RDD</a></dd></dl></div>
+ </li><li visbl="pub" name="spark.RDD#persist" data-isabs="false">
+ <a id="persist():RDD[T]"></a>
+ <h4 class="signature">
+ <span class="modifier_kind">
+ <span class="modifier"></span>
+ <span class="kind">def</span>
+ </span>
+ <span class="symbol">
+ <span class="name">persist</span><span class="params">()</span><span class="result">: <a name="spark.RDD" class="extype" href="../RDD.html">RDD</a>[T]</span>
+ </span>
+ </h4>
+ <p class="shortcomment cmt">Persist this RDD with the default storage level (<code>MEMORY_ONLY</code>).</p><div class="fullcomment"><div class="comment cmt"><p>Persist this RDD with the default storage level (<code>MEMORY_ONLY</code>).</p></div><dl class="attributes block"> <dt>Definition Classes</dt><dd><a name="spark.RDD" class="extype" href="../RDD.html">RDD</a></dd></dl></div>
+ </li><li visbl="pub" name="spark.RDD#persist" data-isabs="false">
+ <a id="persist(StorageLevel):RDD[T]"></a>
+ <h4 class="signature">
+ <span class="modifier_kind">
+ <span class="modifier"></span>
+ <span class="kind">def</span>
+ </span>
+ <span class="symbol">
+ <span class="name">persist</span><span class="params">(<span name="newLevel">newLevel: <a name="spark.storage.StorageLevel" class="extype" href="../storage/StorageLevel.html">StorageLevel</a></span>)</span><span class="result">: <a name="spark.RDD" class="extype" href="../RDD.html">RDD</a>[T]</span>
+ </span>
+ </h4>
+ <p class="shortcomment cmt">Set this RDD's storage level to persist its values across operations after the first time
+it is computed.</p><div class="fullcomment"><div class="comment cmt"><p>Set this RDD's storage level to persist its values across operations after the first time
+it is computed. Can only be called once on each RDD.
+</p></div><dl class="attributes block"> <dt>Definition Classes</dt><dd><a name="spark.RDD" class="extype" href="../RDD.html">RDD</a></dd></dl></div>
+ </li><li visbl="pub" name="spark.RDD#pipe" data-isabs="false">
+ <a id="pipe(Seq[String],Map[String, String]):RDD[String]"></a>
+ <h4 class="signature">
+ <span class="modifier_kind">
+ <span class="modifier"></span>
+ <span class="kind">def</span>
+ </span>
+ <span class="symbol">
+ <span class="name">pipe</span><span class="params">(<span name="command">command: Seq[String]</span>, <span name="env">env: <span name="scala.collection.Map" class="extype">Map</span>[String, String]</span>)</span><span class="result">: <a name="spark.RDD" class="extype" href="../RDD.html">RDD</a>[String]</span>
+ </span>
+ </h4>
+ <p class="shortcomment cmt">Return an RDD created by piping elements to a forked external process.</p><div class="fullcomment"><div class="comment cmt"><p>Return an RDD created by piping elements to a forked external process.
+</p></div><dl class="attributes block"> <dt>Definition Classes</dt><dd><a name="spark.RDD" class="extype" href="../RDD.html">RDD</a></dd></dl></div>
+ </li><li visbl="pub" name="spark.RDD#pipe" data-isabs="false">
+ <a id="pipe(Seq[String]):RDD[String]"></a>
+ <h4 class="signature">
+ <span class="modifier_kind">
+ <span class="modifier"></span>
+ <span class="kind">def</span>
+ </span>
+ <span class="symbol">
+ <span class="name">pipe</span><span class="params">(<span name="command">command: Seq[String]</span>)</span><span class="result">: <a name="spark.RDD" class="extype" href="../RDD.html">RDD</a>[String]</span>
+ </span>
+ </h4>
+ <p class="shortcomment cmt">Return an RDD created by piping elements to a forked external process.</p><div class="fullcomment"><div class="comment cmt"><p>Return an RDD created by piping elements to a forked external process.
+</p></div><dl class="attributes block"> <dt>Definition Classes</dt><dd><a name="spark.RDD" class="extype" href="../RDD.html">RDD</a></dd></dl></div>
+ </li><li visbl="pub" name="spark.RDD#pipe" data-isabs="false">
+ <a id="pipe(String):RDD[String]"></a>
+ <h4 class="signature">
+ <span class="modifier_kind">
+ <span class="modifier"></span>
+ <span class="kind">def</span>
+ </span>
+ <span class="symbol">
+ <span class="name">pipe</span><span class="params">(<span name="command">command: String</span>)</span><span class="result">: <a name="spark.RDD" class="extype" href="../RDD.html">RDD</a>[String]</span>
+ </span>
+ </h4>
+ <p class="shortcomment cmt">Return an RDD created by piping elements to a forked external process.</p><div class="fullcomment"><div class="comment cmt"><p>Return an RDD created by piping elements to a forked external process.
+</p></div><dl class="attributes block"> <dt>Definition Classes</dt><dd><a name="spark.RDD" class="extype" href="../RDD.html">RDD</a></dd></dl></div>
+ </li><li visbl="pub" name="spark.rdd.UnionRDD#preferredLocations" data-isabs="false">
+ <a id="preferredLocations(Split):Seq[String]"></a>
+ <h4 class="signature">
+ <span class="modifier_kind">
+ <span class="modifier"></span>
+ <span class="kind">def</span>
+ </span>
+ <span class="symbol">
+ <span class="name">preferredLocations</span><span class="params">(<span name="s">s: <a name="spark.Split" class="extype" href="../Split.html">Split</a></span>)</span><span class="result">: Seq[String]</span>
+ </span>
+ </h4>
+ <p class="shortcomment cmt">Optionally overridden by subclasses to specify placement preferences.</p><div class="fullcomment"><div class="comment cmt"><p>Optionally overridden by subclasses to specify placement preferences.</p></div><dl class="attributes block"> <dt>Definition Classes</dt><dd><a name="spark.rdd.UnionRDD" class="extype" href="">UnionRDD</a> → <a name="spark.RDD" class="extype" href="../RDD.html">RDD</a></dd></dl></div>
+ </li><li visbl="pub" name="spark.RDD#reduce" data-isabs="false">
+ <a id="reduce((T, T) ⇒ T):T"></a>
+ <h4 class="signature">
+ <span class="modifier_kind">
+ <span class="modifier"></span>
+ <span class="kind">def</span>
+ </span>
+ <span class="symbol">
+ <span class="name">reduce</span><span class="params">(<span name="f">f: (T, T) ⇒ T</span>)</span><span class="result">: T</span>
+ </span>
+ </h4>
+ <p class="shortcomment cmt">Reduces the elements of this RDD using the specified associative binary operator.</p><div class="fullcomment"><div class="comment cmt"><p>Reduces the elements of this RDD using the specified associative binary operator.
+</p></div><dl class="attributes block"> <dt>Definition Classes</dt><dd><a name="spark.RDD" class="extype" href="../RDD.html">RDD</a></dd></dl></div>
+ </li><li visbl="pub" name="spark.RDD#sample" data-isabs="false">
+ <a id="sample(Boolean,Double,Int):RDD[T]"></a>
+ <h4 class="signature">
+ <span class="modifier_kind">
+ <span class="modifier"></span>
+ <span class="kind">def</span>
+ </span>
+ <span class="symbol">
+ <span class="name">sample</span><span class="params">(<span name="withReplacement">withReplacement: <span name="scala.Boolean" class="extype">Boolean</span></span>, <span name="fraction">fraction: <span name="scala.Double" class="extype">Double</span></span>, <span name="seed">seed: <span name="scala.Int" class="extype">Int</span></span>)</span><span class="result">: <a name="spark.RDD" class="extype" href="../RDD.html">RDD</a>[T]</span>
+ </span>
+ </h4>
+ <p class="shortcomment cmt">Return a sampled subset of this RDD.</p><div class="fullcomment"><div class="comment cmt"><p>Return a sampled subset of this RDD.
+</p></div><dl class="attributes block"> <dt>Definition Classes</dt><dd><a name="spark.RDD" class="extype" href="../RDD.html">RDD</a></dd></dl></div>
+ </li><li visbl="pub" name="spark.RDD#saveAsObjectFile" data-isabs="false">
+ <a id="saveAsObjectFile(String):Unit"></a>
+ <h4 class="signature">
+ <span class="modifier_kind">
+ <span class="modifier"></span>
+ <span class="kind">def</span>
+ </span>
+ <span class="symbol">
+ <span class="name">saveAsObjectFile</span><span class="params">(<span name="path">path: String</span>)</span><span class="result">: <span name="scala.Unit" class="extype">Unit</span></span>
+ </span>
+ </h4>
+ <p class="shortcomment cmt">Save this RDD as a SequenceFile of serialized objects.</p><div class="fullcomment"><div class="comment cmt"><p>Save this RDD as a SequenceFile of serialized objects.
+</p></div><dl class="attributes block"> <dt>Definition Classes</dt><dd><a name="spark.RDD" class="extype" href="../RDD.html">RDD</a></dd></dl></div>
+ </li><li visbl="pub" name="spark.RDD#saveAsTextFile" data-isabs="false">
+ <a id="saveAsTextFile(String):Unit"></a>
+ <h4 class="signature">
+ <span class="modifier_kind">
+ <span class="modifier"></span>
+ <span class="kind">def</span>
+ </span>
+ <span class="symbol">
+ <span class="name">saveAsTextFile</span><span class="params">(<span name="path">path: String</span>)</span><span class="result">: <span name="scala.Unit" class="extype">Unit</span></span>
+ </span>
+ </h4>
+ <p class="shortcomment cmt">Save this RDD as a text file, using string representations of elements.</p><div class="fullcomment"><div class="comment cmt"><p>Save this RDD as a text file, using string representations of elements.
+</p></div><dl class="attributes block"> <dt>Definition Classes</dt><dd><a name="spark.RDD" class="extype" href="../RDD.html">RDD</a></dd></dl></div>
+ </li><li visbl="pub" name="spark.rdd.UnionRDD#splits" data-isabs="false">
+ <a id="splits:Array[Split]"></a>
+ <h4 class="signature">
+ <span class="modifier_kind">
+ <span class="modifier"></span>
+ <span class="kind">def</span>
+ </span>
+ <span class="symbol">
+ <span class="name">splits</span><span class="result">: <span name="scala.Array" class="extype">Array</span>[<a name="spark.Split" class="extype" href="../Split.html">Split</a>]</span>
+ </span>
+ </h4>
+ <p class="shortcomment cmt">Set of partitions in this RDD.</p><div class="fullcomment"><div class="comment cmt"><p>Set of partitions in this RDD.</p></div><dl class="attributes block"> <dt>Definition Classes</dt><dd><a name="spark.rdd.UnionRDD" class="extype" href="">UnionRDD</a> → <a name="spark.RDD" class="extype" href="../RDD.html">RDD</a></dd></dl></div>
+ </li><li visbl="pub" name="spark.rdd.UnionRDD#splits_" data-isabs="false">
+ <a id="splits_:Array[Split]"></a>
+ <h4 class="signature">
+ <span class="modifier_kind">
+ <span class="modifier"></span>
+ <span class="kind">val</span>
+ </span>
+ <span class="symbol">
+ <span class="name">splits_</span><span class="result">: <span name="scala.Array" class="extype">Array</span>[<a name="spark.Split" class="extype" href="../Split.html">Split</a>]</span>
+ </span>
+ </h4>
+
+ </li><li visbl="pub" name="scala.AnyRef#synchronized" data-isabs="false">
+ <a id="synchronized[T0](⇒ T0):T0"></a>
+ <h4 class="signature">
+ <span class="modifier_kind">
+ <span class="modifier">final </span>
+ <span class="kind">def</span>
+ </span>
+ <span class="symbol">
+ <span class="name">synchronized</span><span class="tparams">[<span name="T0">T0</span>]</span><span class="params">(<span name="arg0">arg0: ⇒ T0</span>)</span><span class="result">: T0</span>
+ </span>
+ </h4>
+ <div class="fullcomment"><dl class="attributes block"> <dt>Definition Classes</dt><dd>AnyRef</dd></dl></div>
+ </li><li visbl="pub" name="spark.RDD#take" data-isabs="false">
+ <a id="take(Int):Array[T]"></a>
+ <h4 class="signature">
+ <span class="modifier_kind">
+ <span class="modifier"></span>
+ <span class="kind">def</span>
+ </span>
+ <span class="symbol">
+ <span class="name">take</span><span class="params">(<span name="num">num: <span name="scala.Int" class="extype">Int</span></span>)</span><span class="result">: <span name="scala.Array" class="extype">Array</span>[T]</span>
+ </span>
+ </h4>
+ <p class="shortcomment cmt">Take the first num elements of the RDD.</p><div class="fullcomment"><div class="comment cmt"><p>Take the first num elements of the RDD. This currently scans the partitions <i>one by one</i>, so
+it will be slow if a lot of partitions are required. In that case, use <code>collect()</code> to get the
+whole RDD instead.
+</p></div><dl class="attributes block"> <dt>Definition Classes</dt><dd><a name="spark.RDD" class="extype" href="../RDD.html">RDD</a></dd></dl></div>
+ </li><li visbl="pub" name="spark.RDD#takeSample" data-isabs="false">
+ <a id="takeSample(Boolean,Int,Int):Array[T]"></a>
+ <h4 class="signature">
+ <span class="modifier_kind">
+ <span class="modifier"></span>
+ <span class="kind">def</span>
+ </span>
+ <span class="symbol">
+ <span class="name">takeSample</span><span class="params">(<span name="withReplacement">withReplacement: <span name="scala.Boolean" class="extype">Boolean</span></span>, <span name="num">num: <span name="scala.Int" class="extype">Int</span></span>, <span name="seed">seed: <span name="scala.Int" class="extype">Int</span></span>)</span><span class="result">: <span name="scala.Array" class="extype">Array</span>[T]</span>
+ </span>
+ </h4>
+ <div class="fullcomment"><dl class="attributes block"> <dt>Definition Classes</dt><dd><a name="spark.RDD" class="extype" href="../RDD.html">RDD</a></dd></dl></div>
+ </li><li visbl="pub" name="spark.RDD#toArray" data-isabs="false">
+ <a id="toArray():Array[T]"></a>
+ <h4 class="signature">
+ <span class="modifier_kind">
+ <span class="modifier"></span>
+ <span class="kind">def</span>
+ </span>
+ <span class="symbol">
+ <span class="name">toArray</span><span class="params">()</span><span class="result">: <span name="scala.Array" class="extype">Array</span>[T]</span>
+ </span>
+ </h4>
+ <p class="shortcomment cmt">Return an array that contains all of the elements in this RDD.</p><div class="fullcomment"><div class="comment cmt"><p>Return an array that contains all of the elements in this RDD.
+</p></div><dl class="attributes block"> <dt>Definition Classes</dt><dd><a name="spark.RDD" class="extype" href="../RDD.html">RDD</a></dd></dl></div>
+ </li><li visbl="pub" name="scala.AnyRef#toString" data-isabs="false">
+ <a id="toString():String"></a>
+ <h4 class="signature">
+ <span class="modifier_kind">
+ <span class="modifier"></span>
+ <span class="kind">def</span>
+ </span>
+ <span class="symbol">
+ <span class="name">toString</span><span class="params">()</span><span class="result">: <span name="java.lang.String" class="extype">String</span></span>
+ </span>
+ </h4>
+ <div class="fullcomment"><dl class="attributes block"> <dt>Definition Classes</dt><dd>AnyRef → Any</dd></dl></div>
+ </li><li visbl="pub" name="spark.RDD#union" data-isabs="false">
+ <a id="union(RDD[T]):RDD[T]"></a>
+ <h4 class="signature">
+ <span class="modifier_kind">
+ <span class="modifier"></span>
+ <span class="kind">def</span>
+ </span>
+ <span class="symbol">
+ <span class="name">union</span><span class="params">(<span name="other">other: <a name="spark.RDD" class="extype" href="../RDD.html">RDD</a>[T]</span>)</span><span class="result">: <a name="spark.RDD" class="extype" href="../RDD.html">RDD</a>[T]</span>
+ </span>
+ </h4>
+ <p class="shortcomment cmt">Return the union of this RDD and another one.</p><div class="fullcomment"><div class="comment cmt"><p>Return the union of this RDD and another one. Any identical elements will appear multiple
+times (use <code>.distinct()</code> to eliminate them).
+</p></div><dl class="attributes block"> <dt>Definition Classes</dt><dd><a name="spark.RDD" class="extype" href="../RDD.html">RDD</a></dd></dl></div>
+ </li><li visbl="pub" name="scala.AnyRef#wait" data-isabs="false">
+ <a id="wait():Unit"></a>
+ <h4 class="signature">
+ <span class="modifier_kind">
+ <span class="modifier">final </span>
+ <span class="kind">def</span>
+ </span>
+ <span class="symbol">
+ <span class="name">wait</span><span class="params">()</span><span class="result">: <span name="scala.Unit" class="extype">Unit</span></span>
+ </span>
+ </h4>
+ <div class="fullcomment"><dl class="attributes block"> <dt>Definition Classes</dt><dd>AnyRef</dd><dt>Annotations</dt><dd>
+ <span class="name">@throws</span><span class="args">()</span>
+
+ </dd></dl></div>
+ </li><li visbl="pub" name="scala.AnyRef#wait" data-isabs="false">
+ <a id="wait(Long,Int):Unit"></a>
+ <h4 class="signature">
+ <span class="modifier_kind">
+ <span class="modifier">final </span>
+ <span class="kind">def</span>
+ </span>
+ <span class="symbol">
+ <span class="name">wait</span><span class="params">(<span name="arg0">arg0: <span name="scala.Long" class="extype">Long</span></span>, <span name="arg1">arg1: <span name="scala.Int" class="extype">Int</span></span>)</span><span class="result">: <span name="scala.Unit" class="extype">Unit</span></span>
+ </span>
+ </h4>
+ <div class="fullcomment"><dl class="attributes block"> <dt>Definition Classes</dt><dd>AnyRef</dd><dt>Annotations</dt><dd>
+ <span class="name">@throws</span><span class="args">()</span>
+
+ </dd></dl></div>
+ </li><li visbl="pub" name="scala.AnyRef#wait" data-isabs="false">
+ <a id="wait(Long):Unit"></a>
+ <h4 class="signature">
+ <span class="modifier_kind">
+ <span class="modifier">final </span>
+ <span class="kind">def</span>
+ </span>
+ <span class="symbol">
+ <span class="name">wait</span><span class="params">(<span name="arg0">arg0: <span name="scala.Long" class="extype">Long</span></span>)</span><span class="result">: <span name="scala.Unit" class="extype">Unit</span></span>
+ </span>
+ </h4>
+ <div class="fullcomment"><dl class="attributes block"> <dt>Definition Classes</dt><dd>AnyRef</dd><dt>Annotations</dt><dd>
+ <span class="name">@throws</span><span class="args">()</span>
+
+ </dd></dl></div>
+ </li></ol>
+ </div>
+
+
+ </div>
+
+ <div id="inheritedMembers">
+ <div name="spark.RDD" class="parent">
+ <h3>Inherited from <a name="spark.RDD" class="extype" href="../RDD.html">RDD</a>[T]</h3>
+ </div><div name="scala.Serializable" class="parent">
+ <h3>Inherited from <span name="scala.Serializable" class="extype">Serializable</span></h3>
+ </div><div name="java.io.Serializable" class="parent">
+ <h3>Inherited from <span name="java.io.Serializable" class="extype">Serializable</span></h3>
+ </div><div name="scala.AnyRef" class="parent">
+ <h3>Inherited from AnyRef</h3>
+ </div><div name="scala.Any" class="parent">
+ <h3>Inherited from <span name="scala.Any" class="extype">Any</span></h3>
+ </div>
+ </div>
+
+ </div>
+
+ <div id="tooltip"></div>
+
+ <div id="footer"> </div>
+
+
+ </body>
+ </html> \ No newline at end of file