summaryrefslogtreecommitdiff
path: root/site/docs/1.5.0/api/python/index.html
blob: 9e88fa80ab14914da7a9c35f9b9403f088ed88f7 (plain) (blame)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
  "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">

<!-- The page content is English; lang and xml:lang both declare that on the root element. -->
<html xmlns="http://www.w3.org/1999/xhtml" lang="en" xml:lang="en">
  <head>
    <!-- Character encoding declaration and page title. -->
    <meta content="text/html; charset=utf-8" http-equiv="Content-Type" />
    <title>Welcome to Spark Python API Docs! &mdash; PySpark 1.5.0 documentation</title>

    <!-- Stylesheets, in cascade order. -->
    <link href="_static/nature.css" rel="stylesheet" type="text/css" />
    <link href="_static/pygments.css" rel="stylesheet" type="text/css" />

    <!-- Page-level options object, declared before the scripts under _static/ are loaded. -->
    <script type="text/javascript">
      var DOCUMENTATION_OPTIONS = {
        URL_ROOT: './',
        VERSION: '1.5.0',
        COLLAPSE_INDEX: false,
        FILE_SUFFIX: '.html',
        HAS_SOURCE: true
      };
    </script>
    <script src="_static/jquery.js" type="text/javascript"></script>
    <script src="_static/underscore.js" type="text/javascript"></script>
    <script src="_static/doctools.js" type="text/javascript"></script>

    <!-- Document relations: "top" points at this page, "next" at pyspark.html. -->
    <link href="#" rel="top" title="PySpark 1.5.0 documentation" />
    <link href="pyspark.html" rel="next" title="pyspark package" />
  </head>
  <body role="document">
    <!-- Top navigation bar: a "next" link (access key N) and a breadcrumb link to this page. -->
    <div class="related" aria-label="related navigation" role="navigation">
      <h3>Navigation</h3>
      <ul>
        <li class="right" style="margin-right: 10px">
          <a accesskey="N" href="pyspark.html" title="pyspark package">next</a></li>
        <li class="nav-item nav-item-0"><a href="#">PySpark 1.5.0 documentation</a> &raquo;</li>
      </ul>
    </div>

    <div class="document">
      <div class="documentwrapper">
        <div class="bodywrapper">
          <div class="body" role="main">
            
  <div class="section" id="welcome-to-spark-python-api-docs">
<!-- Page heading. The trailing "headerlink" anchor is the permalink to this section; it needs
     visible content (the pilcrow) or there is nothing to see or click. -->
<h1>Welcome to Spark Python API Docs!<a class="headerlink" href="#welcome-to-spark-python-api-docs" title="Permalink to this headline">&para;</a></h1>
<p>Contents:</p>
<!-- Table of contents: one top-level entry per documentation page, each with a nested list of
     links to anchors inside that page. -->
<div class="toctree-wrapper compound">
<ul>
<!-- pyspark.html -->
<li class="toctree-l1"><a class="reference internal" href="pyspark.html">pyspark package</a><ul>
<li class="toctree-l2"><a class="reference internal" href="pyspark.html#subpackages">Subpackages</a></li>
<li class="toctree-l2"><a class="reference internal" href="pyspark.html#module-pyspark">Contents</a></li>
</ul>
</li>
<!-- pyspark.sql.html -->
<li class="toctree-l1"><a class="reference internal" href="pyspark.sql.html">pyspark.sql module</a><ul>
<li class="toctree-l2"><a class="reference internal" href="pyspark.sql.html#module-pyspark.sql">Module Context</a></li>
<li class="toctree-l2"><a class="reference internal" href="pyspark.sql.html#module-pyspark.sql.types">pyspark.sql.types module</a></li>
<li class="toctree-l2"><a class="reference internal" href="pyspark.sql.html#module-pyspark.sql.functions">pyspark.sql.functions module</a></li>
</ul>
</li>
<!-- pyspark.streaming.html -->
<li class="toctree-l1"><a class="reference internal" href="pyspark.streaming.html">pyspark.streaming module</a><ul>
<li class="toctree-l2"><a class="reference internal" href="pyspark.streaming.html#module-pyspark.streaming">Module contents</a></li>
<li class="toctree-l2"><a class="reference internal" href="pyspark.streaming.html#module-pyspark.streaming.kafka">pyspark.streaming.kafka module</a></li>
<li class="toctree-l2"><a class="reference internal" href="pyspark.streaming.html#module-pyspark.streaming.kinesis">pyspark.streaming.kinesis module</a></li>
<li class="toctree-l2"><a class="reference internal" href="pyspark.streaming.html#module-pyspark.streaming.flume">pyspark.streaming.flume module</a></li>
<li class="toctree-l2"><a class="reference internal" href="pyspark.streaming.html#module-pyspark.streaming.mqtt">pyspark.streaming.mqtt module</a></li>
</ul>
</li>
<!-- pyspark.ml.html -->
<li class="toctree-l1"><a class="reference internal" href="pyspark.ml.html">pyspark.ml package</a><ul>
<li class="toctree-l2"><a class="reference internal" href="pyspark.ml.html#module-pyspark.ml">ML Pipeline APIs</a></li>
<li class="toctree-l2"><a class="reference internal" href="pyspark.ml.html#module-pyspark.ml.param">pyspark.ml.param module</a></li>
<li class="toctree-l2"><a class="reference internal" href="pyspark.ml.html#module-pyspark.ml.feature">pyspark.ml.feature module</a></li>
<li class="toctree-l2"><a class="reference internal" href="pyspark.ml.html#module-pyspark.ml.classification">pyspark.ml.classification module</a></li>
<li class="toctree-l2"><a class="reference internal" href="pyspark.ml.html#module-pyspark.ml.clustering">pyspark.ml.clustering module</a></li>
<li class="toctree-l2"><a class="reference internal" href="pyspark.ml.html#module-pyspark.ml.recommendation">pyspark.ml.recommendation module</a></li>
<li class="toctree-l2"><a class="reference internal" href="pyspark.ml.html#module-pyspark.ml.regression">pyspark.ml.regression module</a></li>
<li class="toctree-l2"><a class="reference internal" href="pyspark.ml.html#module-pyspark.ml.tuning">pyspark.ml.tuning module</a></li>
<li class="toctree-l2"><a class="reference internal" href="pyspark.ml.html#module-pyspark.ml.evaluation">pyspark.ml.evaluation module</a></li>
</ul>
</li>
<!-- pyspark.mllib.html -->
<li class="toctree-l1"><a class="reference internal" href="pyspark.mllib.html">pyspark.mllib package</a><ul>
<li class="toctree-l2"><a class="reference internal" href="pyspark.mllib.html#module-pyspark.mllib.classification">pyspark.mllib.classification module</a></li>
<li class="toctree-l2"><a class="reference internal" href="pyspark.mllib.html#module-pyspark.mllib.clustering">pyspark.mllib.clustering module</a></li>
<li class="toctree-l2"><a class="reference internal" href="pyspark.mllib.html#module-pyspark.mllib.evaluation">pyspark.mllib.evaluation module</a></li>
<li class="toctree-l2"><a class="reference internal" href="pyspark.mllib.html#module-pyspark.mllib.feature">pyspark.mllib.feature module</a></li>
<li class="toctree-l2"><a class="reference internal" href="pyspark.mllib.html#module-pyspark.mllib.fpm">pyspark.mllib.fpm module</a></li>
<li class="toctree-l2"><a class="reference internal" href="pyspark.mllib.html#module-pyspark.mllib.linalg">pyspark.mllib.linalg module</a></li>
<li class="toctree-l2"><a class="reference internal" href="pyspark.mllib.html#module-pyspark.mllib.linalg.distributed">pyspark.mllib.linalg.distributed module</a></li>
<li class="toctree-l2"><a class="reference internal" href="pyspark.mllib.html#module-pyspark.mllib.random">pyspark.mllib.random module</a></li>
<li class="toctree-l2"><a class="reference internal" href="pyspark.mllib.html#module-pyspark.mllib.recommendation">pyspark.mllib.recommendation module</a></li>
<li class="toctree-l2"><a class="reference internal" href="pyspark.mllib.html#module-pyspark.mllib.regression">pyspark.mllib.regression module</a></li>
<li class="toctree-l2"><a class="reference internal" href="pyspark.mllib.html#module-pyspark.mllib.stat">pyspark.mllib.stat module</a></li>
<li class="toctree-l2"><a class="reference internal" href="pyspark.mllib.html#module-pyspark.mllib.tree">pyspark.mllib.tree module</a></li>
<li class="toctree-l2"><a class="reference internal" href="pyspark.mllib.html#module-pyspark.mllib.util">pyspark.mllib.util module</a></li>
</ul>
</li>
</ul>
</div>
<!-- "Core classes" section: each entry is a link to the class reference followed by a
     one-sentence description. -->
<div class="section" id="core-classes">
<!-- The headerlink anchor is this section's permalink; the pilcrow gives it visible content. -->
<h2>Core classes:<a class="headerlink" href="#core-classes" title="Permalink to this headline">&para;</a></h2>
<blockquote>
<div><p><a class="reference internal" href="pyspark.html#pyspark.SparkContext" title="pyspark.SparkContext"><code class="xref py py-class docutils literal"><span class="pre">pyspark.SparkContext</span></code></a></p>
<p>Main entry point for Spark functionality.</p>
<p><a class="reference internal" href="pyspark.html#pyspark.RDD" title="pyspark.RDD"><code class="xref py py-class docutils literal"><span class="pre">pyspark.RDD</span></code></a></p>
<p>A Resilient Distributed Dataset (RDD), the basic abstraction in Spark.</p>
<p><a class="reference internal" href="pyspark.streaming.html#pyspark.streaming.StreamingContext" title="pyspark.streaming.StreamingContext"><code class="xref py py-class docutils literal"><span class="pre">pyspark.streaming.StreamingContext</span></code></a></p>
<p>Main entry point for Spark Streaming functionality.</p>
<p><a class="reference internal" href="pyspark.streaming.html#pyspark.streaming.DStream" title="pyspark.streaming.DStream"><code class="xref py py-class docutils literal"><span class="pre">pyspark.streaming.DStream</span></code></a></p>
<p>A Discretized Stream (DStream), the basic abstraction in Spark Streaming.</p>
<p><a class="reference internal" href="pyspark.sql.html#pyspark.sql.SQLContext" title="pyspark.sql.SQLContext"><code class="xref py py-class docutils literal"><span class="pre">pyspark.sql.SQLContext</span></code></a></p>
<p>Main entry point for DataFrame and SQL functionality.</p>
<p><a class="reference internal" href="pyspark.sql.html#pyspark.sql.DataFrame" title="pyspark.sql.DataFrame"><code class="xref py py-class docutils literal"><span class="pre">pyspark.sql.DataFrame</span></code></a></p>
<p>A distributed collection of data grouped into named columns.</p>
</div></blockquote>
</div>
</div>
<!-- "Indices and tables" section: currently a single link to the search page. -->
<div class="section" id="indices-and-tables">
<!-- The headerlink anchor is this section's permalink; the pilcrow gives it visible content. -->
<h1>Indices and tables<a class="headerlink" href="#indices-and-tables" title="Permalink to this headline">&para;</a></h1>
<ul class="simple">
<li><a class="reference internal" href="search.html"><span>Search Page</span></a></li>
</ul>
</div>


          </div>
        </div>
      </div>
      <div class="sphinxsidebar" role="navigation" aria-label="main navigation">
        <div class="sphinxsidebarwrapper">
            <!-- Sidebar logo, linked to the top of this page. The alt text names the image
                 so the link is not announced as a bare "Logo". -->
            <p class="logo"><a href="#">
              <img class="logo" src="_static/spark-logo-hd.png" alt="Spark logo"/>
            </a></p>
  <!-- In-page table of contents: links to the section anchors on this page. -->
  <h3><a href="#">Table Of Contents</a></h3>
  <ul>
    <li><a class="reference internal" href="#">Welcome to Spark Python API Docs!</a>
      <ul>
        <li><a class="reference internal" href="#core-classes">Core classes:</a></li>
      </ul>
    </li>
    <li><a class="reference internal" href="#indices-and-tables">Indices and tables</a></li>
  </ul>

  <!-- Sidebar link to the following page, pyspark.html. -->
  <h4>Next topic</h4>
  <p class="topless"><a title="next chapter" href="pyspark.html">pyspark package</a></p>
  <!-- "This Page" menu: link to the page's source text under _sources/. -->
  <div aria-label="source link" role="note">
    <h3>This Page</h3>
    <ul class="this-page-menu">
      <li><a rel="nofollow" href="_sources/index.txt">Show Source</a></li>
    </ul>
  </div>
<!-- Quick-search form, submitted to search.html via GET. The box is rendered with
     display: none and revealed by the inline script that follows it, so it only shows
     when that script runs. -->
<div id="searchbox" style="display: none" role="search">
  <!-- The id lets the text input below reference this heading as its accessible name. -->
  <h3 id="searchlabel">Quick search</h3>
    <form class="search" action="search.html" method="get">
      <input type="text" name="q" aria-labelledby="searchlabel" />
      <input type="submit" value="Go" />
      <input type="hidden" name="check_keywords" value="yes" />
      <input type="hidden" name="area" value="default" />
    </form>
    <p class="searchtip" style="font-size: 90%">
    Enter search terms or a module, class or function name.
    </p>
</div>
<script type="text/javascript">$('#searchbox').show(0);</script>
        </div>
      </div>
      <div class="clearer"></div>
    </div>
    <!-- Bottom navigation bar: a "next" link and a breadcrumb link to this page. -->
    <div class="related" aria-label="related navigation" role="navigation">
      <h3>Navigation</h3>
      <ul>
        <li class="right" style="margin-right: 10px">
          <a href="pyspark.html" title="pyspark package">next</a></li>
        <li class="nav-item nav-item-0"><a href="#">PySpark 1.5.0 documentation</a> &raquo;</li>
      </ul>
    </div>
    <!-- Page footer: copyright line and generator credit.
         NOTE(review): the copyright holder is blank ("Copyright ."); presumably the
         copyright value was not set when the docs were built. Confirm and fill in. -->
    <div class="footer" role="contentinfo">
        &copy; Copyright .
      Created using <a href="https://www.sphinx-doc.org/">Sphinx</a> 1.3.1.
    </div>
  </body>
</html>