summaryrefslogtreecommitdiff
path: root/site/docs/1.0.1/api/python/pyspark.serializers-pysrc.html
diff options
context:
space:
mode:
authorPatrick Wendell <pwendell@apache.org>2014-07-11 17:23:23 +0000
committerPatrick Wendell <pwendell@apache.org>2014-07-11 17:23:23 +0000
commit0beac4e243f85e71554fe04093b09eb1745fea82 (patch)
treebc20d10426c5d57e2f189305865dc2bbec447923 /site/docs/1.0.1/api/python/pyspark.serializers-pysrc.html
parentddec2123ba6ab95543d1b250d4f20fb811c48f09 (diff)
downloadspark-website-0beac4e243f85e71554fe04093b09eb1745fea82.tar.gz
spark-website-0beac4e243f85e71554fe04093b09eb1745fea82.tar.bz2
spark-website-0beac4e243f85e71554fe04093b09eb1745fea82.zip
Updating docs for 1.0.1 release
Diffstat (limited to 'site/docs/1.0.1/api/python/pyspark.serializers-pysrc.html')
-rw-r--r--site/docs/1.0.1/api/python/pyspark.serializers-pysrc.html485
1 files changed, 485 insertions, 0 deletions
diff --git a/site/docs/1.0.1/api/python/pyspark.serializers-pysrc.html b/site/docs/1.0.1/api/python/pyspark.serializers-pysrc.html
new file mode 100644
index 000000000..ee71e607a
--- /dev/null
+++ b/site/docs/1.0.1/api/python/pyspark.serializers-pysrc.html
@@ -0,0 +1,485 @@
+<?xml version="1.0" encoding="ascii"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
+ "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+<head>
+ <title>pyspark.serializers</title>
+ <link rel="stylesheet" href="epydoc.css" type="text/css" />
+ <script type="text/javascript" src="epydoc.js"></script>
+</head>
+
+<body bgcolor="white" text="black" link="blue" vlink="#204080"
+ alink="#204080">
+<!-- ==================== NAVIGATION BAR ==================== -->
+<table class="navbar" border="0" width="100%" cellpadding="0"
+ bgcolor="#a0c0ff" cellspacing="0">
+ <tr valign="middle">
+ <!-- Home link -->
+ <th>&nbsp;&nbsp;&nbsp;<a
+ href="pyspark-module.html">Home</a>&nbsp;&nbsp;&nbsp;</th>
+
+ <!-- Tree link -->
+ <th>&nbsp;&nbsp;&nbsp;<a
+ href="module-tree.html">Trees</a>&nbsp;&nbsp;&nbsp;</th>
+
+ <!-- Index link -->
+ <th>&nbsp;&nbsp;&nbsp;<a
+ href="identifier-index.html">Indices</a>&nbsp;&nbsp;&nbsp;</th>
+
+ <!-- Help link -->
+ <th>&nbsp;&nbsp;&nbsp;<a
+ href="help.html">Help</a>&nbsp;&nbsp;&nbsp;</th>
+
+ <!-- Project homepage -->
+ <th class="navbar" align="right" width="100%">
+ <table border="0" cellpadding="0" cellspacing="0">
+ <tr><th class="navbar" align="center"
+ ><a class="navbar" target="_top" href="http://spark.apache.org">Spark 1.0.1 Python API Docs</a></th>
+ </tr></table></th>
+ </tr>
+</table>
+<table width="100%" cellpadding="0" cellspacing="0">
+ <tr valign="top">
+ <td width="100%">
+ <span class="breadcrumbs">
+ <a href="pyspark-module.html">Package&nbsp;pyspark</a> ::
+ Module&nbsp;serializers
+ </span>
+ </td>
+ <td>
+ <table cellpadding="0" cellspacing="0">
+ <!-- frames / no frames links -->
+ <tr><td align="right"><span class="options"
+ >[<a href="frames.html" target="_top">frames</a
+ >]&nbsp;|&nbsp;<a href="pyspark.serializers-pysrc.html"
+ target="_top">no&nbsp;frames</a>]</span></td></tr>
+ </table>
+ </td>
+ </tr>
+</table>
+<h1 class="epydoc">Source Code for <a href="pyspark.serializers-module.html">Module pyspark.serializers</a></h1>
+<pre class="py-src">
+<a name="L1"></a><tt class="py-lineno"> 1</tt> <tt class="py-line"><tt class="py-comment">#</tt> </tt>
+<a name="L2"></a><tt class="py-lineno"> 2</tt> <tt class="py-line"><tt class="py-comment"># Licensed to the Apache Software Foundation (ASF) under one or more</tt> </tt>
+<a name="L3"></a><tt class="py-lineno"> 3</tt> <tt class="py-line"><tt class="py-comment"># contributor license agreements. See the NOTICE file distributed with</tt> </tt>
+<a name="L4"></a><tt class="py-lineno"> 4</tt> <tt class="py-line"><tt class="py-comment"># this work for additional information regarding copyright ownership.</tt> </tt>
+<a name="L5"></a><tt class="py-lineno"> 5</tt> <tt class="py-line"><tt class="py-comment"># The ASF licenses this file to You under the Apache License, Version 2.0</tt> </tt>
+<a name="L6"></a><tt class="py-lineno"> 6</tt> <tt class="py-line"><tt class="py-comment"># (the "License"); you may not use this file except in compliance with</tt> </tt>
+<a name="L7"></a><tt class="py-lineno"> 7</tt> <tt class="py-line"><tt class="py-comment"># the License. You may obtain a copy of the License at</tt> </tt>
+<a name="L8"></a><tt class="py-lineno"> 8</tt> <tt class="py-line"><tt class="py-comment">#</tt> </tt>
+<a name="L9"></a><tt class="py-lineno"> 9</tt> <tt class="py-line"><tt class="py-comment"># http://www.apache.org/licenses/LICENSE-2.0</tt> </tt>
+<a name="L10"></a><tt class="py-lineno"> 10</tt> <tt class="py-line"><tt class="py-comment">#</tt> </tt>
+<a name="L11"></a><tt class="py-lineno"> 11</tt> <tt class="py-line"><tt class="py-comment"># Unless required by applicable law or agreed to in writing, software</tt> </tt>
+<a name="L12"></a><tt class="py-lineno"> 12</tt> <tt class="py-line"><tt class="py-comment"># distributed under the License is distributed on an "AS IS" BASIS,</tt> </tt>
+<a name="L13"></a><tt class="py-lineno"> 13</tt> <tt class="py-line"><tt class="py-comment"># WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.</tt> </tt>
+<a name="L14"></a><tt class="py-lineno"> 14</tt> <tt class="py-line"><tt class="py-comment"># See the License for the specific language governing permissions and</tt> </tt>
+<a name="L15"></a><tt class="py-lineno"> 15</tt> <tt class="py-line"><tt class="py-comment"># limitations under the License.</tt> </tt>
+<a name="L16"></a><tt class="py-lineno"> 16</tt> <tt class="py-line"><tt class="py-comment">#</tt> </tt>
+<a name="L17"></a><tt class="py-lineno"> 17</tt> <tt class="py-line"> </tt>
+<a name="L18"></a><tt class="py-lineno"> 18</tt> <tt class="py-line"><tt class="py-docstring">"""</tt> </tt>
+<a name="L19"></a><tt class="py-lineno"> 19</tt> <tt class="py-line"><tt class="py-docstring">PySpark supports custom serializers for transferring data; this can improve</tt> </tt>
+<a name="L20"></a><tt class="py-lineno"> 20</tt> <tt class="py-line"><tt class="py-docstring">performance.</tt> </tt>
+<a name="L21"></a><tt class="py-lineno"> 21</tt> <tt class="py-line"><tt class="py-docstring"></tt> </tt>
+<a name="L22"></a><tt class="py-lineno"> 22</tt> <tt class="py-line"><tt class="py-docstring">By default, PySpark uses L{PickleSerializer} to serialize objects using Python's</tt> </tt>
+<a name="L23"></a><tt class="py-lineno"> 23</tt> <tt class="py-line"><tt class="py-docstring">C{cPickle} serializer, which can serialize nearly any Python object.</tt> </tt>
+<a name="L24"></a><tt class="py-lineno"> 24</tt> <tt class="py-line"><tt class="py-docstring">Other serializers, like L{MarshalSerializer}, support fewer datatypes but can be</tt> </tt>
+<a name="L25"></a><tt class="py-lineno"> 25</tt> <tt class="py-line"><tt class="py-docstring">faster.</tt> </tt>
+<a name="L26"></a><tt class="py-lineno"> 26</tt> <tt class="py-line"><tt class="py-docstring"></tt> </tt>
+<a name="L27"></a><tt class="py-lineno"> 27</tt> <tt class="py-line"><tt class="py-docstring">The serializer is chosen when creating L{SparkContext}:</tt> </tt>
+<a name="L28"></a><tt class="py-lineno"> 28</tt> <tt class="py-line"><tt class="py-docstring"></tt> </tt>
+<a name="L29"></a><tt class="py-lineno"> 29</tt> <tt class="py-line"><tt class="py-docstring">&gt;&gt;&gt; from pyspark.context import SparkContext</tt> </tt>
+<a name="L30"></a><tt class="py-lineno"> 30</tt> <tt class="py-line"><tt class="py-docstring">&gt;&gt;&gt; from pyspark.serializers import MarshalSerializer</tt> </tt>
+<a name="L31"></a><tt class="py-lineno"> 31</tt> <tt class="py-line"><tt class="py-docstring">&gt;&gt;&gt; sc = SparkContext('local', 'test', serializer=MarshalSerializer())</tt> </tt>
+<a name="L32"></a><tt class="py-lineno"> 32</tt> <tt class="py-line"><tt class="py-docstring">&gt;&gt;&gt; sc.parallelize(list(range(1000))).map(lambda x: 2 * x).take(10)</tt> </tt>
+<a name="L33"></a><tt class="py-lineno"> 33</tt> <tt class="py-line"><tt class="py-docstring">[0, 2, 4, 6, 8, 10, 12, 14, 16, 18]</tt> </tt>
+<a name="L34"></a><tt class="py-lineno"> 34</tt> <tt class="py-line"><tt class="py-docstring">&gt;&gt;&gt; sc.stop()</tt> </tt>
+<a name="L35"></a><tt class="py-lineno"> 35</tt> <tt class="py-line"><tt class="py-docstring"></tt> </tt>
+<a name="L36"></a><tt class="py-lineno"> 36</tt> <tt class="py-line"><tt class="py-docstring">By default, PySpark serializes objects in batches; the batch size can be</tt> </tt>
+<a name="L37"></a><tt class="py-lineno"> 37</tt> <tt class="py-line"><tt class="py-docstring">controlled through SparkContext's C{batchSize} parameter</tt> </tt>
+<a name="L38"></a><tt class="py-lineno"> 38</tt> <tt class="py-line"><tt class="py-docstring">(the default size is 1024 objects):</tt> </tt>
+<a name="L39"></a><tt class="py-lineno"> 39</tt> <tt class="py-line"><tt class="py-docstring"></tt> </tt>
+<a name="L40"></a><tt class="py-lineno"> 40</tt> <tt class="py-line"><tt class="py-docstring">&gt;&gt;&gt; sc = SparkContext('local', 'test', batchSize=2)</tt> </tt>
+<a name="L41"></a><tt class="py-lineno"> 41</tt> <tt class="py-line"><tt class="py-docstring">&gt;&gt;&gt; rdd = sc.parallelize(range(16), 4).map(lambda x: x)</tt> </tt>
+<a name="L42"></a><tt class="py-lineno"> 42</tt> <tt class="py-line"><tt class="py-docstring"></tt> </tt>
+<a name="L43"></a><tt class="py-lineno"> 43</tt> <tt class="py-line"><tt class="py-docstring">Behind the scenes, this creates a JavaRDD with four partitions, each of</tt> </tt>
+<a name="L44"></a><tt class="py-lineno"> 44</tt> <tt class="py-line"><tt class="py-docstring">which contains two batches of two objects:</tt> </tt>
+<a name="L45"></a><tt class="py-lineno"> 45</tt> <tt class="py-line"><tt class="py-docstring"></tt> </tt>
+<a name="L46"></a><tt class="py-lineno"> 46</tt> <tt class="py-line"><tt class="py-docstring">&gt;&gt;&gt; rdd.glom().collect()</tt> </tt>
+<a name="L47"></a><tt class="py-lineno"> 47</tt> <tt class="py-line"><tt class="py-docstring">[[0, 1, 2, 3], [4, 5, 6, 7], [8, 9, 10, 11], [12, 13, 14, 15]]</tt> </tt>
+<a name="L48"></a><tt class="py-lineno"> 48</tt> <tt class="py-line"><tt class="py-docstring">&gt;&gt;&gt; rdd._jrdd.count()</tt> </tt>
+<a name="L49"></a><tt class="py-lineno"> 49</tt> <tt class="py-line"><tt class="py-docstring">8L</tt> </tt>
+<a name="L50"></a><tt class="py-lineno"> 50</tt> <tt class="py-line"><tt class="py-docstring">&gt;&gt;&gt; sc.stop()</tt> </tt>
+<a name="L51"></a><tt class="py-lineno"> 51</tt> <tt class="py-line"><tt class="py-docstring"></tt> </tt>
+<a name="L52"></a><tt class="py-lineno"> 52</tt> <tt class="py-line"><tt class="py-docstring">A batch size of -1 uses an unlimited batch size, and a size of 1 disables</tt> </tt>
+<a name="L53"></a><tt class="py-lineno"> 53</tt> <tt class="py-line"><tt class="py-docstring">batching:</tt> </tt>
+<a name="L54"></a><tt class="py-lineno"> 54</tt> <tt class="py-line"><tt class="py-docstring"></tt> </tt>
+<a name="L55"></a><tt class="py-lineno"> 55</tt> <tt class="py-line"><tt class="py-docstring">&gt;&gt;&gt; sc = SparkContext('local', 'test', batchSize=1)</tt> </tt>
+<a name="L56"></a><tt class="py-lineno"> 56</tt> <tt class="py-line"><tt class="py-docstring">&gt;&gt;&gt; rdd = sc.parallelize(range(16), 4).map(lambda x: x)</tt> </tt>
+<a name="L57"></a><tt class="py-lineno"> 57</tt> <tt class="py-line"><tt class="py-docstring">&gt;&gt;&gt; rdd.glom().collect()</tt> </tt>
+<a name="L58"></a><tt class="py-lineno"> 58</tt> <tt class="py-line"><tt class="py-docstring">[[0, 1, 2, 3], [4, 5, 6, 7], [8, 9, 10, 11], [12, 13, 14, 15]]</tt> </tt>
+<a name="L59"></a><tt class="py-lineno"> 59</tt> <tt class="py-line"><tt class="py-docstring">&gt;&gt;&gt; rdd._jrdd.count()</tt> </tt>
+<a name="L60"></a><tt class="py-lineno"> 60</tt> <tt class="py-line"><tt class="py-docstring">16L</tt> </tt>
+<a name="L61"></a><tt class="py-lineno"> 61</tt> <tt class="py-line"><tt class="py-docstring">"""</tt> </tt>
+<a name="L62"></a><tt class="py-lineno"> 62</tt> <tt class="py-line"> </tt>
+<a name="L63"></a><tt class="py-lineno"> 63</tt> <tt class="py-line"><tt class="py-keyword">import</tt> <tt class="py-name">cPickle</tt> </tt>
+<a name="L64"></a><tt class="py-lineno"> 64</tt> <tt class="py-line"><tt class="py-keyword">from</tt> <tt class="py-name">itertools</tt> <tt class="py-keyword">import</tt> <tt class="py-name">chain</tt><tt class="py-op">,</tt> <tt class="py-name">izip</tt><tt class="py-op">,</tt> <tt class="py-name">product</tt> </tt>
+<a name="L65"></a><tt class="py-lineno"> 65</tt> <tt class="py-line"><tt class="py-keyword">import</tt> <tt class="py-name">marshal</tt> </tt>
+<a name="L66"></a><tt class="py-lineno"> 66</tt> <tt class="py-line"><tt class="py-keyword">import</tt> <tt class="py-name">struct</tt> </tt>
+<a name="L67"></a><tt class="py-lineno"> 67</tt> <tt class="py-line"><tt class="py-keyword">import</tt> <tt class="py-name">sys</tt> </tt>
+<a name="L68"></a><tt class="py-lineno"> 68</tt> <tt class="py-line"><tt class="py-keyword">from</tt> <tt id="link-0" class="py-name" targets="Package pyspark=pyspark-module.html"><a title="pyspark" class="py-name" href="#" onclick="return doclink('link-0', 'pyspark', 'link-0');">pyspark</a></tt> <tt class="py-keyword">import</tt> <tt class="py-name">cloudpickle</tt> </tt>
+<a name="L69"></a><tt class="py-lineno"> 69</tt> <tt class="py-line"> </tt>
+<a name="L70"></a><tt class="py-lineno"> 70</tt> <tt class="py-line"> </tt>
+<a name="L71"></a><tt class="py-lineno"> 71</tt> <tt class="py-line"><tt class="py-name">__all__</tt> <tt class="py-op">=</tt> <tt class="py-op">[</tt><tt class="py-string">"PickleSerializer"</tt><tt class="py-op">,</tt> <tt class="py-string">"MarshalSerializer"</tt><tt class="py-op">]</tt> </tt>
+<a name="L72"></a><tt class="py-lineno"> 72</tt> <tt class="py-line"> </tt>
+<a name="L73"></a><tt class="py-lineno"> 73</tt> <tt class="py-line"> </tt>
+<a name="SpecialLengths"></a><div id="SpecialLengths-def"><a name="L74"></a><tt class="py-lineno"> 74</tt> <a class="py-toggle" href="#" id="SpecialLengths-toggle" onclick="return toggle('SpecialLengths');">-</a><tt class="py-line"><tt class="py-keyword">class</tt> <a class="py-def-name" href="pyspark.serializers.SpecialLengths-class.html">SpecialLengths</a><tt class="py-op">(</tt><tt class="py-base-class">object</tt><tt class="py-op">)</tt><tt class="py-op">:</tt> </tt>
+</div><div id="SpecialLengths-collapsed" style="display:none;" pad="+++" indent="++++"></div><div id="SpecialLengths-expanded"><a name="L75"></a><tt class="py-lineno"> 75</tt> <tt class="py-line"> <tt class="py-name">END_OF_DATA_SECTION</tt> <tt class="py-op">=</tt> <tt class="py-op">-</tt><tt class="py-number">1</tt> </tt>
+<a name="L76"></a><tt class="py-lineno"> 76</tt> <tt class="py-line"> <tt class="py-name">PYTHON_EXCEPTION_THROWN</tt> <tt class="py-op">=</tt> <tt class="py-op">-</tt><tt class="py-number">2</tt> </tt>
+<a name="L77"></a><tt class="py-lineno"> 77</tt> <tt class="py-line"> <tt class="py-name">TIMING_DATA</tt> <tt class="py-op">=</tt> <tt class="py-op">-</tt><tt class="py-number">3</tt> </tt>
+</div><a name="L78"></a><tt class="py-lineno"> 78</tt> <tt class="py-line"> </tt>
+<a name="L79"></a><tt class="py-lineno"> 79</tt> <tt class="py-line"> </tt>
+<a name="Serializer"></a><div id="Serializer-def"><a name="L80"></a><tt class="py-lineno"> 80</tt> <a class="py-toggle" href="#" id="Serializer-toggle" onclick="return toggle('Serializer');">-</a><tt class="py-line"><tt class="py-keyword">class</tt> <a class="py-def-name" href="pyspark.serializers.Serializer-class.html">Serializer</a><tt class="py-op">(</tt><tt class="py-base-class">object</tt><tt class="py-op">)</tt><tt class="py-op">:</tt> </tt>
+</div><div id="Serializer-collapsed" style="display:none;" pad="+++" indent="++++"></div><div id="Serializer-expanded"><a name="L81"></a><tt class="py-lineno"> 81</tt> <tt class="py-line"> </tt>
+<a name="Serializer.dump_stream"></a><div id="Serializer.dump_stream-def"><a name="L82"></a><tt class="py-lineno"> 82</tt> <a class="py-toggle" href="#" id="Serializer.dump_stream-toggle" onclick="return toggle('Serializer.dump_stream');">-</a><tt class="py-line"> <tt class="py-keyword">def</tt> <a class="py-def-name" href="pyspark.serializers.Serializer-class.html#dump_stream">dump_stream</a><tt class="py-op">(</tt><tt class="py-param">self</tt><tt class="py-op">,</tt> <tt class="py-param">iterator</tt><tt class="py-op">,</tt> <tt class="py-param">stream</tt><tt class="py-op">)</tt><tt class="py-op">:</tt> </tt>
+</div><div id="Serializer.dump_stream-collapsed" style="display:none;" pad="+++" indent="++++++++"></div><div id="Serializer.dump_stream-expanded"><a name="L83"></a><tt class="py-lineno"> 83</tt> <tt class="py-line"> <tt class="py-docstring">"""</tt> </tt>
+<a name="L84"></a><tt class="py-lineno"> 84</tt> <tt class="py-line"><tt class="py-docstring"> Serialize an iterator of objects to the output stream.</tt> </tt>
+<a name="L85"></a><tt class="py-lineno"> 85</tt> <tt class="py-line"><tt class="py-docstring"> """</tt> </tt>
+<a name="L86"></a><tt class="py-lineno"> 86</tt> <tt class="py-line"> <tt class="py-keyword">raise</tt> <tt class="py-name">NotImplementedError</tt> </tt>
+</div><a name="L87"></a><tt class="py-lineno"> 87</tt> <tt class="py-line"> </tt>
+<a name="Serializer.load_stream"></a><div id="Serializer.load_stream-def"><a name="L88"></a><tt class="py-lineno"> 88</tt> <a class="py-toggle" href="#" id="Serializer.load_stream-toggle" onclick="return toggle('Serializer.load_stream');">-</a><tt class="py-line"> <tt class="py-keyword">def</tt> <a class="py-def-name" href="pyspark.serializers.Serializer-class.html#load_stream">load_stream</a><tt class="py-op">(</tt><tt class="py-param">self</tt><tt class="py-op">,</tt> <tt class="py-param">stream</tt><tt class="py-op">)</tt><tt class="py-op">:</tt> </tt>
+</div><div id="Serializer.load_stream-collapsed" style="display:none;" pad="+++" indent="++++++++"></div><div id="Serializer.load_stream-expanded"><a name="L89"></a><tt class="py-lineno"> 89</tt> <tt class="py-line"> <tt class="py-docstring">"""</tt> </tt>
+<a name="L90"></a><tt class="py-lineno"> 90</tt> <tt class="py-line"><tt class="py-docstring"> Return an iterator of deserialized objects from the input stream.</tt> </tt>
+<a name="L91"></a><tt class="py-lineno"> 91</tt> <tt class="py-line"><tt class="py-docstring"> """</tt> </tt>
+<a name="L92"></a><tt class="py-lineno"> 92</tt> <tt class="py-line"> <tt class="py-keyword">raise</tt> <tt class="py-name">NotImplementedError</tt> </tt>
+</div><a name="L93"></a><tt class="py-lineno"> 93</tt> <tt class="py-line"> </tt>
+<a name="L94"></a><tt class="py-lineno"> 94</tt> <tt class="py-line"> </tt>
+<a name="Serializer._load_stream_without_unbatching"></a><div id="Serializer._load_stream_without_unbatching-def"><a name="L95"></a><tt class="py-lineno"> 95</tt> <a class="py-toggle" href="#" id="Serializer._load_stream_without_unbatching-toggle" onclick="return toggle('Serializer._load_stream_without_unbatching');">-</a><tt class="py-line"> <tt class="py-keyword">def</tt> <a class="py-def-name" href="pyspark.serializers.Serializer-class.html#_load_stream_without_unbatching">_load_stream_without_unbatching</a><tt class="py-op">(</tt><tt class="py-param">self</tt><tt class="py-op">,</tt> <tt class="py-param">stream</tt><tt class="py-op">)</tt><tt class="py-op">:</tt> </tt>
+</div><div id="Serializer._load_stream_without_unbatching-collapsed" style="display:none;" pad="+++" indent="++++++++"></div><div id="Serializer._load_stream_without_unbatching-expanded"><a name="L96"></a><tt class="py-lineno"> 96</tt> <tt class="py-line"> <tt class="py-keyword">return</tt> <tt class="py-name">self</tt><tt class="py-op">.</tt><tt class="py-name">load_stream</tt><tt class="py-op">(</tt><tt class="py-name">stream</tt><tt class="py-op">)</tt> </tt>
+</div><a name="L97"></a><tt class="py-lineno"> 97</tt> <tt class="py-line"> </tt>
+<a name="L98"></a><tt class="py-lineno"> 98</tt> <tt class="py-line"> <tt class="py-comment"># Note: our notion of "equality" is that output generated by</tt> </tt>
+<a name="L99"></a><tt class="py-lineno"> 99</tt> <tt class="py-line"> <tt class="py-comment"># equal serializers can be deserialized using the same serializer.</tt> </tt>
+<a name="L100"></a><tt class="py-lineno">100</tt> <tt class="py-line"> </tt>
+<a name="L101"></a><tt class="py-lineno">101</tt> <tt class="py-line"> <tt class="py-comment"># This default implementation handles the simple cases;</tt> </tt>
+<a name="L102"></a><tt class="py-lineno">102</tt> <tt class="py-line"> <tt class="py-comment"># subclasses should override __eq__ as appropriate.</tt> </tt>
+<a name="L103"></a><tt class="py-lineno">103</tt> <tt class="py-line"> </tt>
+<a name="Serializer.__eq__"></a><div id="Serializer.__eq__-def"><a name="L104"></a><tt class="py-lineno">104</tt> <a class="py-toggle" href="#" id="Serializer.__eq__-toggle" onclick="return toggle('Serializer.__eq__');">-</a><tt class="py-line"> <tt class="py-keyword">def</tt> <a class="py-def-name" href="pyspark.serializers.Serializer-class.html#__eq__">__eq__</a><tt class="py-op">(</tt><tt class="py-param">self</tt><tt class="py-op">,</tt> <tt class="py-param">other</tt><tt class="py-op">)</tt><tt class="py-op">:</tt> </tt>
+</div><div id="Serializer.__eq__-collapsed" style="display:none;" pad="+++" indent="++++++++"></div><div id="Serializer.__eq__-expanded"><a name="L105"></a><tt class="py-lineno">105</tt> <tt class="py-line"> <tt class="py-keyword">return</tt> <tt class="py-name">isinstance</tt><tt class="py-op">(</tt><tt class="py-name">other</tt><tt class="py-op">,</tt> <tt class="py-name">self</tt><tt class="py-op">.</tt><tt class="py-name">__class__</tt><tt class="py-op">)</tt> </tt>
+</div><a name="L106"></a><tt class="py-lineno">106</tt> <tt class="py-line"> </tt>
+<a name="Serializer.__ne__"></a><div id="Serializer.__ne__-def"><a name="L107"></a><tt class="py-lineno">107</tt> <a class="py-toggle" href="#" id="Serializer.__ne__-toggle" onclick="return toggle('Serializer.__ne__');">-</a><tt class="py-line"> <tt class="py-keyword">def</tt> <a class="py-def-name" href="pyspark.serializers.Serializer-class.html#__ne__">__ne__</a><tt class="py-op">(</tt><tt class="py-param">self</tt><tt class="py-op">,</tt> <tt class="py-param">other</tt><tt class="py-op">)</tt><tt class="py-op">:</tt> </tt>
+</div><div id="Serializer.__ne__-collapsed" style="display:none;" pad="+++" indent="++++++++"></div><div id="Serializer.__ne__-expanded"><a name="L108"></a><tt class="py-lineno">108</tt> <tt class="py-line"> <tt class="py-keyword">return</tt> <tt class="py-keyword">not</tt> <tt class="py-name">self</tt><tt class="py-op">.</tt><tt id="link-1" class="py-name" targets="Method pyspark.mllib.linalg.SparseVector.__eq__()=pyspark.mllib.linalg.SparseVector-class.html#__eq__"><a title="pyspark.mllib.linalg.SparseVector.__eq__" class="py-name" href="#" onclick="return doclink('link-1', '__eq__', 'link-1');">__eq__</a></tt><tt class="py-op">(</tt><tt class="py-name">other</tt><tt class="py-op">)</tt> </tt>
+</div></div><a name="L109"></a><tt class="py-lineno">109</tt> <tt class="py-line"> </tt>
+<a name="L110"></a><tt class="py-lineno">110</tt> <tt class="py-line"> </tt>
+<a name="FramedSerializer"></a><div id="FramedSerializer-def"><a name="L111"></a><tt class="py-lineno">111</tt> <a class="py-toggle" href="#" id="FramedSerializer-toggle" onclick="return toggle('FramedSerializer');">-</a><tt class="py-line"><tt class="py-keyword">class</tt> <a class="py-def-name" href="pyspark.serializers.FramedSerializer-class.html">FramedSerializer</a><tt class="py-op">(</tt><tt class="py-base-class">Serializer</tt><tt class="py-op">)</tt><tt class="py-op">:</tt> </tt>
+</div><div id="FramedSerializer-collapsed" style="display:none;" pad="+++" indent="++++"></div><div id="FramedSerializer-expanded"><a name="L112"></a><tt class="py-lineno">112</tt> <tt class="py-line"> <tt class="py-docstring">"""</tt> </tt>
+<a name="L113"></a><tt class="py-lineno">113</tt> <tt class="py-line"><tt class="py-docstring"> Serializer that writes objects as a stream of (length, data) pairs,</tt> </tt>
+<a name="L114"></a><tt class="py-lineno">114</tt> <tt class="py-line"><tt class="py-docstring"> where C{length} is a 32-bit integer and data is C{length} bytes.</tt> </tt>
+<a name="L115"></a><tt class="py-lineno">115</tt> <tt class="py-line"><tt class="py-docstring"> """</tt> </tt>
+<a name="L116"></a><tt class="py-lineno">116</tt> <tt class="py-line"> </tt>
+<a name="FramedSerializer.__init__"></a><div id="FramedSerializer.__init__-def"><a name="L117"></a><tt class="py-lineno">117</tt> <a class="py-toggle" href="#" id="FramedSerializer.__init__-toggle" onclick="return toggle('FramedSerializer.__init__');">-</a><tt class="py-line"> <tt class="py-keyword">def</tt> <a class="py-def-name" href="pyspark.serializers.FramedSerializer-class.html#__init__">__init__</a><tt class="py-op">(</tt><tt class="py-param">self</tt><tt class="py-op">)</tt><tt class="py-op">:</tt> </tt>
+</div><div id="FramedSerializer.__init__-collapsed" style="display:none;" pad="+++" indent="++++++++"></div><div id="FramedSerializer.__init__-expanded"><a name="L118"></a><tt class="py-lineno">118</tt> <tt class="py-line"> <tt class="py-comment"># On Python 2.6, we can't write bytearrays to streams, so we need to convert them</tt> </tt>
+<a name="L119"></a><tt class="py-lineno">119</tt> <tt class="py-line"> <tt class="py-comment"># to strings first. Check if the version number is that old.</tt> </tt>
+<a name="L120"></a><tt class="py-lineno">120</tt> <tt class="py-line"> <tt class="py-name">self</tt><tt class="py-op">.</tt><tt class="py-name">_only_write_strings</tt> <tt class="py-op">=</tt> <tt class="py-name">sys</tt><tt class="py-op">.</tt><tt class="py-name">version_info</tt><tt class="py-op">[</tt><tt class="py-number">0</tt><tt class="py-op">:</tt><tt class="py-number">2</tt><tt class="py-op">]</tt> <tt class="py-op">&lt;=</tt> <tt class="py-op">(</tt><tt class="py-number">2</tt><tt class="py-op">,</tt> <tt class="py-number">6</tt><tt class="py-op">)</tt> </tt>
+</div><a name="L121"></a><tt class="py-lineno">121</tt> <tt class="py-line"> </tt>
+<a name="FramedSerializer.dump_stream"></a><div id="FramedSerializer.dump_stream-def"><a name="L122"></a><tt class="py-lineno">122</tt> <a class="py-toggle" href="#" id="FramedSerializer.dump_stream-toggle" onclick="return toggle('FramedSerializer.dump_stream');">-</a><tt class="py-line"> <tt class="py-keyword">def</tt> <a class="py-def-name" href="pyspark.serializers.FramedSerializer-class.html#dump_stream">dump_stream</a><tt class="py-op">(</tt><tt class="py-param">self</tt><tt class="py-op">,</tt> <tt class="py-param">iterator</tt><tt class="py-op">,</tt> <tt class="py-param">stream</tt><tt class="py-op">)</tt><tt class="py-op">:</tt> </tt>
+</div><div id="FramedSerializer.dump_stream-collapsed" style="display:none;" pad="+++" indent="++++++++"></div><div id="FramedSerializer.dump_stream-expanded"><a name="L123"></a><tt class="py-lineno">123</tt> <tt class="py-line"> <tt class="py-keyword">for</tt> <tt class="py-name">obj</tt> <tt class="py-keyword">in</tt> <tt class="py-name">iterator</tt><tt class="py-op">:</tt> </tt>
+<a name="L124"></a><tt class="py-lineno">124</tt> <tt class="py-line"> <tt class="py-name">self</tt><tt class="py-op">.</tt><tt class="py-name">_write_with_length</tt><tt class="py-op">(</tt><tt class="py-name">obj</tt><tt class="py-op">,</tt> <tt class="py-name">stream</tt><tt class="py-op">)</tt> </tt>
+</div><a name="L125"></a><tt class="py-lineno">125</tt> <tt class="py-line"> </tt>
+<a name="FramedSerializer.load_stream"></a><div id="FramedSerializer.load_stream-def"><a name="L126"></a><tt class="py-lineno">126</tt> <a class="py-toggle" href="#" id="FramedSerializer.load_stream-toggle" onclick="return toggle('FramedSerializer.load_stream');">-</a><tt class="py-line"> <tt class="py-keyword">def</tt> <a class="py-def-name" href="pyspark.serializers.FramedSerializer-class.html#load_stream">load_stream</a><tt class="py-op">(</tt><tt class="py-param">self</tt><tt class="py-op">,</tt> <tt class="py-param">stream</tt><tt class="py-op">)</tt><tt class="py-op">:</tt> </tt>
+</div><div id="FramedSerializer.load_stream-collapsed" style="display:none;" pad="+++" indent="++++++++"></div><div id="FramedSerializer.load_stream-expanded"><a name="L127"></a><tt class="py-lineno">127</tt> <tt class="py-line"> <tt class="py-keyword">while</tt> <tt class="py-name">True</tt><tt class="py-op">:</tt> </tt>
+<a name="L128"></a><tt class="py-lineno">128</tt> <tt class="py-line"> <tt class="py-keyword">try</tt><tt class="py-op">:</tt> </tt>
+<a name="L129"></a><tt class="py-lineno">129</tt> <tt class="py-line"> <tt class="py-keyword">yield</tt> <tt class="py-name">self</tt><tt class="py-op">.</tt><tt class="py-name">_read_with_length</tt><tt class="py-op">(</tt><tt class="py-name">stream</tt><tt class="py-op">)</tt> </tt>
+<a name="L130"></a><tt class="py-lineno">130</tt> <tt class="py-line"> <tt class="py-keyword">except</tt> <tt class="py-name">EOFError</tt><tt class="py-op">:</tt> </tt>
+<a name="L131"></a><tt class="py-lineno">131</tt> <tt class="py-line"> <tt class="py-keyword">return</tt> </tt>
+</div><a name="L132"></a><tt class="py-lineno">132</tt> <tt class="py-line"> </tt>
+<a name="FramedSerializer._write_with_length"></a><div id="FramedSerializer._write_with_length-def"><a name="L133"></a><tt class="py-lineno">133</tt> <a class="py-toggle" href="#" id="FramedSerializer._write_with_length-toggle" onclick="return toggle('FramedSerializer._write_with_length');">-</a><tt class="py-line"> <tt class="py-keyword">def</tt> <a class="py-def-name" href="pyspark.serializers.FramedSerializer-class.html#_write_with_length">_write_with_length</a><tt class="py-op">(</tt><tt class="py-param">self</tt><tt class="py-op">,</tt> <tt class="py-param">obj</tt><tt class="py-op">,</tt> <tt class="py-param">stream</tt><tt class="py-op">)</tt><tt class="py-op">:</tt> </tt>
+</div><div id="FramedSerializer._write_with_length-collapsed" style="display:none;" pad="+++" indent="++++++++"></div><div id="FramedSerializer._write_with_length-expanded"><a name="L134"></a><tt class="py-lineno">134</tt> <tt class="py-line"> <tt class="py-name">serialized</tt> <tt class="py-op">=</tt> <tt class="py-name">self</tt><tt class="py-op">.</tt><tt id="link-2" class="py-name" targets="Variable pyspark.serializers.MarshalSerializer.dumps=pyspark.serializers.MarshalSerializer-class.html#dumps,Method pyspark.serializers.PickleSerializer.dumps()=pyspark.serializers.PickleSerializer-class.html#dumps"><a title="pyspark.serializers.MarshalSerializer.dumps
+pyspark.serializers.PickleSerializer.dumps" class="py-name" href="#" onclick="return doclink('link-2', 'dumps', 'link-2');">dumps</a></tt><tt class="py-op">(</tt><tt class="py-name">obj</tt><tt class="py-op">)</tt> </tt>
+<a name="L135"></a><tt class="py-lineno">135</tt> <tt class="py-line"> <tt class="py-name">write_int</tt><tt class="py-op">(</tt><tt class="py-name">len</tt><tt class="py-op">(</tt><tt class="py-name">serialized</tt><tt class="py-op">)</tt><tt class="py-op">,</tt> <tt class="py-name">stream</tt><tt class="py-op">)</tt> </tt>
+<a name="L136"></a><tt class="py-lineno">136</tt> <tt class="py-line"> <tt class="py-keyword">if</tt> <tt class="py-name">self</tt><tt class="py-op">.</tt><tt class="py-name">_only_write_strings</tt><tt class="py-op">:</tt> </tt>
+<a name="L137"></a><tt class="py-lineno">137</tt> <tt class="py-line"> <tt class="py-name">stream</tt><tt class="py-op">.</tt><tt class="py-name">write</tt><tt class="py-op">(</tt><tt class="py-name">str</tt><tt class="py-op">(</tt><tt class="py-name">serialized</tt><tt class="py-op">)</tt><tt class="py-op">)</tt> </tt>
+<a name="L138"></a><tt class="py-lineno">138</tt> <tt class="py-line"> <tt class="py-keyword">else</tt><tt class="py-op">:</tt> </tt>
+<a name="L139"></a><tt class="py-lineno">139</tt> <tt class="py-line"> <tt class="py-name">stream</tt><tt class="py-op">.</tt><tt class="py-name">write</tt><tt class="py-op">(</tt><tt class="py-name">serialized</tt><tt class="py-op">)</tt> </tt>
+</div><a name="L140"></a><tt class="py-lineno">140</tt> <tt class="py-line"> </tt>
+<a name="FramedSerializer._read_with_length"></a><div id="FramedSerializer._read_with_length-def"><a name="L141"></a><tt class="py-lineno">141</tt> <a class="py-toggle" href="#" id="FramedSerializer._read_with_length-toggle" onclick="return toggle('FramedSerializer._read_with_length');">-</a><tt class="py-line"> <tt class="py-keyword">def</tt> <a class="py-def-name" href="pyspark.serializers.FramedSerializer-class.html#_read_with_length">_read_with_length</a><tt class="py-op">(</tt><tt class="py-param">self</tt><tt class="py-op">,</tt> <tt class="py-param">stream</tt><tt class="py-op">)</tt><tt class="py-op">:</tt> </tt>
+</div><div id="FramedSerializer._read_with_length-collapsed" style="display:none;" pad="+++" indent="++++++++"></div><div id="FramedSerializer._read_with_length-expanded"><a name="L142"></a><tt class="py-lineno">142</tt> <tt class="py-line"> <tt class="py-name">length</tt> <tt class="py-op">=</tt> <tt class="py-name">read_int</tt><tt class="py-op">(</tt><tt class="py-name">stream</tt><tt class="py-op">)</tt> </tt>
+<a name="L143"></a><tt class="py-lineno">143</tt> <tt class="py-line"> <tt class="py-name">obj</tt> <tt class="py-op">=</tt> <tt class="py-name">stream</tt><tt class="py-op">.</tt><tt class="py-name">read</tt><tt class="py-op">(</tt><tt class="py-name">length</tt><tt class="py-op">)</tt> </tt>
+<a name="L144"></a><tt class="py-lineno">144</tt> <tt class="py-line"> <tt class="py-keyword">if</tt> <tt class="py-name">obj</tt> <tt class="py-op">==</tt> <tt class="py-string">""</tt><tt class="py-op">:</tt> </tt>
+<a name="L145"></a><tt class="py-lineno">145</tt> <tt class="py-line"> <tt class="py-keyword">raise</tt> <tt class="py-name">EOFError</tt> </tt>
+<a name="L146"></a><tt class="py-lineno">146</tt> <tt class="py-line"> <tt class="py-keyword">return</tt> <tt class="py-name">self</tt><tt class="py-op">.</tt><tt id="link-3" class="py-name" targets="Variable pyspark.serializers.MarshalSerializer.loads=pyspark.serializers.MarshalSerializer-class.html#loads,Variable pyspark.serializers.PickleSerializer.loads=pyspark.serializers.PickleSerializer-class.html#loads"><a title="pyspark.serializers.MarshalSerializer.loads
+pyspark.serializers.PickleSerializer.loads" class="py-name" href="#" onclick="return doclink('link-3', 'loads', 'link-3');">loads</a></tt><tt class="py-op">(</tt><tt class="py-name">obj</tt><tt class="py-op">)</tt> </tt>
+</div><a name="L147"></a><tt class="py-lineno">147</tt> <tt class="py-line"> </tt>
+<a name="FramedSerializer.dumps"></a><div id="FramedSerializer.dumps-def"><a name="L148"></a><tt class="py-lineno">148</tt> <a class="py-toggle" href="#" id="FramedSerializer.dumps-toggle" onclick="return toggle('FramedSerializer.dumps');">-</a><tt class="py-line"> <tt class="py-keyword">def</tt> <a class="py-def-name" href="pyspark.serializers.FramedSerializer-class.html#dumps">dumps</a><tt class="py-op">(</tt><tt class="py-param">self</tt><tt class="py-op">,</tt> <tt class="py-param">obj</tt><tt class="py-op">)</tt><tt class="py-op">:</tt> </tt>
+</div><div id="FramedSerializer.dumps-collapsed" style="display:none;" pad="+++" indent="++++++++"></div><div id="FramedSerializer.dumps-expanded"><a name="L149"></a><tt class="py-lineno">149</tt> <tt class="py-line"> <tt class="py-docstring">"""</tt> </tt>
+<a name="L150"></a><tt class="py-lineno">150</tt> <tt class="py-line"><tt class="py-docstring"> Serialize an object into a byte array.</tt> </tt>
+<a name="L151"></a><tt class="py-lineno">151</tt> <tt class="py-line"><tt class="py-docstring"> When batching is used, this will be called with an array of objects.</tt> </tt>
+<a name="L152"></a><tt class="py-lineno">152</tt> <tt class="py-line"><tt class="py-docstring"> """</tt> </tt>
+<a name="L153"></a><tt class="py-lineno">153</tt> <tt class="py-line"> <tt class="py-keyword">raise</tt> <tt class="py-name">NotImplementedError</tt> </tt>
+</div><a name="L154"></a><tt class="py-lineno">154</tt> <tt class="py-line"> </tt>
+<a name="FramedSerializer.loads"></a><div id="FramedSerializer.loads-def"><a name="L155"></a><tt class="py-lineno">155</tt> <a class="py-toggle" href="#" id="FramedSerializer.loads-toggle" onclick="return toggle('FramedSerializer.loads');">-</a><tt class="py-line"> <tt class="py-keyword">def</tt> <a class="py-def-name" href="pyspark.serializers.FramedSerializer-class.html#loads">loads</a><tt class="py-op">(</tt><tt class="py-param">self</tt><tt class="py-op">,</tt> <tt class="py-param">obj</tt><tt class="py-op">)</tt><tt class="py-op">:</tt> </tt>
+</div><div id="FramedSerializer.loads-collapsed" style="display:none;" pad="+++" indent="++++++++"></div><div id="FramedSerializer.loads-expanded"><a name="L156"></a><tt class="py-lineno">156</tt> <tt class="py-line"> <tt class="py-docstring">"""</tt> </tt>
+<a name="L157"></a><tt class="py-lineno">157</tt> <tt class="py-line"><tt class="py-docstring"> Deserialize an object from a byte array.</tt> </tt>
+<a name="L158"></a><tt class="py-lineno">158</tt> <tt class="py-line"><tt class="py-docstring"> """</tt> </tt>
+<a name="L159"></a><tt class="py-lineno">159</tt> <tt class="py-line"> <tt class="py-keyword">raise</tt> <tt class="py-name">NotImplementedError</tt> </tt>
+</div></div><a name="L160"></a><tt class="py-lineno">160</tt> <tt class="py-line"> </tt>
+<a name="L161"></a><tt class="py-lineno">161</tt> <tt class="py-line"> </tt>
+<a name="BatchedSerializer"></a><div id="BatchedSerializer-def"><a name="L162"></a><tt class="py-lineno">162</tt> <a class="py-toggle" href="#" id="BatchedSerializer-toggle" onclick="return toggle('BatchedSerializer');">-</a><tt class="py-line"><tt class="py-keyword">class</tt> <a class="py-def-name" href="pyspark.serializers.BatchedSerializer-class.html">BatchedSerializer</a><tt class="py-op">(</tt><tt class="py-base-class">Serializer</tt><tt class="py-op">)</tt><tt class="py-op">:</tt> </tt>
+</div><div id="BatchedSerializer-collapsed" style="display:none;" pad="+++" indent="++++"></div><div id="BatchedSerializer-expanded"><a name="L163"></a><tt class="py-lineno">163</tt> <tt class="py-line"> <tt class="py-docstring">"""</tt> </tt>
+<a name="L164"></a><tt class="py-lineno">164</tt> <tt class="py-line"><tt class="py-docstring"> Serializes a stream of objects in batches by calling its wrapped</tt> </tt>
+<a name="L165"></a><tt class="py-lineno">165</tt> <tt class="py-line"><tt class="py-docstring"> Serializer with streams of objects.</tt> </tt>
+<a name="L166"></a><tt class="py-lineno">166</tt> <tt class="py-line"><tt class="py-docstring"> """</tt> </tt>
+<a name="L167"></a><tt class="py-lineno">167</tt> <tt class="py-line"> </tt>
+<a name="L168"></a><tt class="py-lineno">168</tt> <tt class="py-line"> <tt class="py-name">UNLIMITED_BATCH_SIZE</tt> <tt class="py-op">=</tt> <tt class="py-op">-</tt><tt class="py-number">1</tt> </tt>
+<a name="L169"></a><tt class="py-lineno">169</tt> <tt class="py-line"> </tt>
+<a name="BatchedSerializer.__init__"></a><div id="BatchedSerializer.__init__-def"><a name="L170"></a><tt class="py-lineno">170</tt> <a class="py-toggle" href="#" id="BatchedSerializer.__init__-toggle" onclick="return toggle('BatchedSerializer.__init__');">-</a><tt class="py-line"> <tt class="py-keyword">def</tt> <a class="py-def-name" href="pyspark.serializers.BatchedSerializer-class.html#__init__">__init__</a><tt class="py-op">(</tt><tt class="py-param">self</tt><tt class="py-op">,</tt> <tt class="py-param">serializer</tt><tt class="py-op">,</tt> <tt class="py-param">batchSize</tt><tt class="py-op">=</tt><tt class="py-name">UNLIMITED_BATCH_SIZE</tt><tt class="py-op">)</tt><tt class="py-op">:</tt> </tt>
+</div><div id="BatchedSerializer.__init__-collapsed" style="display:none;" pad="+++" indent="++++++++"></div><div id="BatchedSerializer.__init__-expanded"><a name="L171"></a><tt class="py-lineno">171</tt> <tt class="py-line"> <tt class="py-name">self</tt><tt class="py-op">.</tt><tt class="py-name">serializer</tt> <tt class="py-op">=</tt> <tt class="py-name">serializer</tt> </tt>
+<a name="L172"></a><tt class="py-lineno">172</tt> <tt class="py-line"> <tt class="py-name">self</tt><tt class="py-op">.</tt><tt class="py-name">batchSize</tt> <tt class="py-op">=</tt> <tt class="py-name">batchSize</tt> </tt>
+</div><a name="L173"></a><tt class="py-lineno">173</tt> <tt class="py-line"> </tt>
+<a name="BatchedSerializer._batched"></a><div id="BatchedSerializer._batched-def"><a name="L174"></a><tt class="py-lineno">174</tt> <a class="py-toggle" href="#" id="BatchedSerializer._batched-toggle" onclick="return toggle('BatchedSerializer._batched');">-</a><tt class="py-line"> <tt class="py-keyword">def</tt> <a class="py-def-name" href="pyspark.serializers.BatchedSerializer-class.html#_batched">_batched</a><tt class="py-op">(</tt><tt class="py-param">self</tt><tt class="py-op">,</tt> <tt class="py-param">iterator</tt><tt class="py-op">)</tt><tt class="py-op">:</tt> </tt>
+</div><div id="BatchedSerializer._batched-collapsed" style="display:none;" pad="+++" indent="++++++++"></div><div id="BatchedSerializer._batched-expanded"><a name="L175"></a><tt class="py-lineno">175</tt> <tt class="py-line"> <tt class="py-keyword">if</tt> <tt class="py-name">self</tt><tt class="py-op">.</tt><tt class="py-name">batchSize</tt> <tt class="py-op">==</tt> <tt class="py-name">self</tt><tt class="py-op">.</tt><tt class="py-name">UNLIMITED_BATCH_SIZE</tt><tt class="py-op">:</tt> </tt>
+<a name="L176"></a><tt class="py-lineno">176</tt> <tt class="py-line"> <tt class="py-keyword">yield</tt> <tt class="py-name">list</tt><tt class="py-op">(</tt><tt class="py-name">iterator</tt><tt class="py-op">)</tt> </tt>
+<a name="L177"></a><tt class="py-lineno">177</tt> <tt class="py-line"> <tt class="py-keyword">else</tt><tt class="py-op">:</tt> </tt>
+<a name="L178"></a><tt class="py-lineno">178</tt> <tt class="py-line"> <tt class="py-name">items</tt> <tt class="py-op">=</tt> <tt class="py-op">[</tt><tt class="py-op">]</tt> </tt>
+<a name="L179"></a><tt class="py-lineno">179</tt> <tt class="py-line"> <tt id="link-4" class="py-name" targets="Method pyspark.rdd.RDD.count()=pyspark.rdd.RDD-class.html#count,Method pyspark.sql.SchemaRDD.count()=pyspark.sql.SchemaRDD-class.html#count,Method pyspark.statcounter.StatCounter.count()=pyspark.statcounter.StatCounter-class.html#count"><a title="pyspark.rdd.RDD.count
+pyspark.sql.SchemaRDD.count
+pyspark.statcounter.StatCounter.count" class="py-name" href="#" onclick="return doclink('link-4', 'count', 'link-4');">count</a></tt> <tt class="py-op">=</tt> <tt class="py-number">0</tt> </tt>
+<a name="L180"></a><tt class="py-lineno">180</tt> <tt class="py-line"> <tt class="py-keyword">for</tt> <tt class="py-name">item</tt> <tt class="py-keyword">in</tt> <tt class="py-name">iterator</tt><tt class="py-op">:</tt> </tt>
+<a name="L181"></a><tt class="py-lineno">181</tt> <tt class="py-line"> <tt class="py-name">items</tt><tt class="py-op">.</tt><tt class="py-name">append</tt><tt class="py-op">(</tt><tt class="py-name">item</tt><tt class="py-op">)</tt> </tt>
+<a name="L182"></a><tt class="py-lineno">182</tt> <tt class="py-line"> <tt id="link-5" class="py-name"><a title="pyspark.rdd.RDD.count
+pyspark.sql.SchemaRDD.count
+pyspark.statcounter.StatCounter.count" class="py-name" href="#" onclick="return doclink('link-5', 'count', 'link-4');">count</a></tt> <tt class="py-op">+=</tt> <tt class="py-number">1</tt> </tt>
+<a name="L183"></a><tt class="py-lineno">183</tt> <tt class="py-line"> <tt class="py-keyword">if</tt> <tt id="link-6" class="py-name"><a title="pyspark.rdd.RDD.count
+pyspark.sql.SchemaRDD.count
+pyspark.statcounter.StatCounter.count" class="py-name" href="#" onclick="return doclink('link-6', 'count', 'link-4');">count</a></tt> <tt class="py-op">==</tt> <tt class="py-name">self</tt><tt class="py-op">.</tt><tt class="py-name">batchSize</tt><tt class="py-op">:</tt> </tt>
+<a name="L184"></a><tt class="py-lineno">184</tt> <tt class="py-line"> <tt class="py-keyword">yield</tt> <tt class="py-name">items</tt> </tt>
+<a name="L185"></a><tt class="py-lineno">185</tt> <tt class="py-line"> <tt class="py-name">items</tt> <tt class="py-op">=</tt> <tt class="py-op">[</tt><tt class="py-op">]</tt> </tt>
+<a name="L186"></a><tt class="py-lineno">186</tt> <tt class="py-line"> <tt id="link-7" class="py-name"><a title="pyspark.rdd.RDD.count
+pyspark.sql.SchemaRDD.count
+pyspark.statcounter.StatCounter.count" class="py-name" href="#" onclick="return doclink('link-7', 'count', 'link-4');">count</a></tt> <tt class="py-op">=</tt> <tt class="py-number">0</tt> </tt>
+<a name="L187"></a><tt class="py-lineno">187</tt> <tt class="py-line"> <tt class="py-keyword">if</tt> <tt class="py-name">items</tt><tt class="py-op">:</tt> </tt>
+<a name="L188"></a><tt class="py-lineno">188</tt> <tt class="py-line"> <tt class="py-keyword">yield</tt> <tt class="py-name">items</tt> </tt>
+</div><a name="L189"></a><tt class="py-lineno">189</tt> <tt class="py-line"> </tt>
+<a name="BatchedSerializer.dump_stream"></a><div id="BatchedSerializer.dump_stream-def"><a name="L190"></a><tt class="py-lineno">190</tt> <a class="py-toggle" href="#" id="BatchedSerializer.dump_stream-toggle" onclick="return toggle('BatchedSerializer.dump_stream');">-</a><tt class="py-line"> <tt class="py-keyword">def</tt> <a class="py-def-name" href="pyspark.serializers.BatchedSerializer-class.html#dump_stream">dump_stream</a><tt class="py-op">(</tt><tt class="py-param">self</tt><tt class="py-op">,</tt> <tt class="py-param">iterator</tt><tt class="py-op">,</tt> <tt class="py-param">stream</tt><tt class="py-op">)</tt><tt class="py-op">:</tt> </tt>
+</div><div id="BatchedSerializer.dump_stream-collapsed" style="display:none;" pad="+++" indent="++++++++"></div><div id="BatchedSerializer.dump_stream-expanded"><a name="L191"></a><tt class="py-lineno">191</tt> <tt class="py-line"> <tt class="py-name">self</tt><tt class="py-op">.</tt><tt class="py-name">serializer</tt><tt class="py-op">.</tt><tt class="py-name">dump_stream</tt><tt class="py-op">(</tt><tt class="py-name">self</tt><tt class="py-op">.</tt><tt class="py-name">_batched</tt><tt class="py-op">(</tt><tt class="py-name">iterator</tt><tt class="py-op">)</tt><tt class="py-op">,</tt> <tt class="py-name">stream</tt><tt class="py-op">)</tt> </tt>
+</div><a name="L192"></a><tt class="py-lineno">192</tt> <tt class="py-line"> </tt>
+<a name="BatchedSerializer.load_stream"></a><div id="BatchedSerializer.load_stream-def"><a name="L193"></a><tt class="py-lineno">193</tt> <a class="py-toggle" href="#" id="BatchedSerializer.load_stream-toggle" onclick="return toggle('BatchedSerializer.load_stream');">-</a><tt class="py-line"> <tt class="py-keyword">def</tt> <a class="py-def-name" href="pyspark.serializers.BatchedSerializer-class.html#load_stream">load_stream</a><tt class="py-op">(</tt><tt class="py-param">self</tt><tt class="py-op">,</tt> <tt class="py-param">stream</tt><tt class="py-op">)</tt><tt class="py-op">:</tt> </tt>
+</div><div id="BatchedSerializer.load_stream-collapsed" style="display:none;" pad="+++" indent="++++++++"></div><div id="BatchedSerializer.load_stream-expanded"><a name="L194"></a><tt class="py-lineno">194</tt> <tt class="py-line"> <tt class="py-keyword">return</tt> <tt class="py-name">chain</tt><tt class="py-op">.</tt><tt class="py-name">from_iterable</tt><tt class="py-op">(</tt><tt class="py-name">self</tt><tt class="py-op">.</tt><tt class="py-name">_load_stream_without_unbatching</tt><tt class="py-op">(</tt><tt class="py-name">stream</tt><tt class="py-op">)</tt><tt class="py-op">)</tt> </tt>
+</div><a name="L195"></a><tt class="py-lineno">195</tt> <tt class="py-line"> </tt>
+<a name="BatchedSerializer._load_stream_without_unbatching"></a><div id="BatchedSerializer._load_stream_without_unbatching-def"><a name="L196"></a><tt class="py-lineno">196</tt> <a class="py-toggle" href="#" id="BatchedSerializer._load_stream_without_unbatching-toggle" onclick="return toggle('BatchedSerializer._load_stream_without_unbatching');">-</a><tt class="py-line"> <tt class="py-keyword">def</tt> <a class="py-def-name" href="pyspark.serializers.BatchedSerializer-class.html#_load_stream_without_unbatching">_load_stream_without_unbatching</a><tt class="py-op">(</tt><tt class="py-param">self</tt><tt class="py-op">,</tt> <tt class="py-param">stream</tt><tt class="py-op">)</tt><tt class="py-op">:</tt> </tt>
+</div><div id="BatchedSerializer._load_stream_without_unbatching-collapsed" style="display:none;" pad="+++" indent="++++++++"></div><div id="BatchedSerializer._load_stream_without_unbatching-expanded"><a name="L197"></a><tt class="py-lineno">197</tt> <tt class="py-line"> <tt class="py-keyword">return</tt> <tt class="py-name">self</tt><tt class="py-op">.</tt><tt class="py-name">serializer</tt><tt class="py-op">.</tt><tt class="py-name">load_stream</tt><tt class="py-op">(</tt><tt class="py-name">stream</tt><tt class="py-op">)</tt> </tt>
+</div><a name="L198"></a><tt class="py-lineno">198</tt> <tt class="py-line"> </tt>
+<a name="BatchedSerializer.__eq__"></a><div id="BatchedSerializer.__eq__-def"><a name="L199"></a><tt class="py-lineno">199</tt> <a class="py-toggle" href="#" id="BatchedSerializer.__eq__-toggle" onclick="return toggle('BatchedSerializer.__eq__');">-</a><tt class="py-line"> <tt class="py-keyword">def</tt> <a class="py-def-name" href="pyspark.serializers.BatchedSerializer-class.html#__eq__">__eq__</a><tt class="py-op">(</tt><tt class="py-param">self</tt><tt class="py-op">,</tt> <tt class="py-param">other</tt><tt class="py-op">)</tt><tt class="py-op">:</tt> </tt>
+</div><div id="BatchedSerializer.__eq__-collapsed" style="display:none;" pad="+++" indent="++++++++"></div><div id="BatchedSerializer.__eq__-expanded"><a name="L200"></a><tt class="py-lineno">200</tt> <tt class="py-line"> <tt class="py-keyword">return</tt> <tt class="py-name">isinstance</tt><tt class="py-op">(</tt><tt class="py-name">other</tt><tt class="py-op">,</tt> <tt class="py-name">BatchedSerializer</tt><tt class="py-op">)</tt> <tt class="py-keyword">and</tt> \ </tt>
+<a name="L201"></a><tt class="py-lineno">201</tt> <tt class="py-line"> <tt class="py-name">other</tt><tt class="py-op">.</tt><tt class="py-name">serializer</tt> <tt class="py-op">==</tt> <tt class="py-name">self</tt><tt class="py-op">.</tt><tt class="py-name">serializer</tt> </tt>
+</div><a name="L202"></a><tt class="py-lineno">202</tt> <tt class="py-line"> </tt>
+<a name="BatchedSerializer.__str__"></a><div id="BatchedSerializer.__str__-def"><a name="L203"></a><tt class="py-lineno">203</tt> <a class="py-toggle" href="#" id="BatchedSerializer.__str__-toggle" onclick="return toggle('BatchedSerializer.__str__');">-</a><tt class="py-line"> <tt class="py-keyword">def</tt> <a class="py-def-name" href="pyspark.serializers.BatchedSerializer-class.html#__str__">__str__</a><tt class="py-op">(</tt><tt class="py-param">self</tt><tt class="py-op">)</tt><tt class="py-op">:</tt> </tt>
+</div><div id="BatchedSerializer.__str__-collapsed" style="display:none;" pad="+++" indent="++++++++"></div><div id="BatchedSerializer.__str__-expanded"><a name="L204"></a><tt class="py-lineno">204</tt> <tt class="py-line"> <tt class="py-keyword">return</tt> <tt class="py-string">"BatchedSerializer&lt;%s&gt;"</tt> <tt class="py-op">%</tt> <tt class="py-name">str</tt><tt class="py-op">(</tt><tt class="py-name">self</tt><tt class="py-op">.</tt><tt class="py-name">serializer</tt><tt class="py-op">)</tt> </tt>
+</div></div><a name="L205"></a><tt class="py-lineno">205</tt> <tt class="py-line"> </tt>
+<a name="L206"></a><tt class="py-lineno">206</tt> <tt class="py-line"> </tt>
+<a name="CartesianDeserializer"></a><div id="CartesianDeserializer-def"><a name="L207"></a><tt class="py-lineno">207</tt> <a class="py-toggle" href="#" id="CartesianDeserializer-toggle" onclick="return toggle('CartesianDeserializer');">-</a><tt class="py-line"><tt class="py-keyword">class</tt> <a class="py-def-name" href="pyspark.serializers.CartesianDeserializer-class.html">CartesianDeserializer</a><tt class="py-op">(</tt><tt class="py-base-class">FramedSerializer</tt><tt class="py-op">)</tt><tt class="py-op">:</tt> </tt>
+</div><div id="CartesianDeserializer-collapsed" style="display:none;" pad="+++" indent="++++"></div><div id="CartesianDeserializer-expanded"><a name="L208"></a><tt class="py-lineno">208</tt> <tt class="py-line"> <tt class="py-docstring">"""</tt> </tt>
+<a name="L209"></a><tt class="py-lineno">209</tt> <tt class="py-line"><tt class="py-docstring"> Deserializes the JavaRDD cartesian() of two PythonRDDs.</tt> </tt>
+<a name="L210"></a><tt class="py-lineno">210</tt> <tt class="py-line"><tt class="py-docstring"> """</tt> </tt>
+<a name="L211"></a><tt class="py-lineno">211</tt> <tt class="py-line"> </tt>
+<a name="CartesianDeserializer.__init__"></a><div id="CartesianDeserializer.__init__-def"><a name="L212"></a><tt class="py-lineno">212</tt> <a class="py-toggle" href="#" id="CartesianDeserializer.__init__-toggle" onclick="return toggle('CartesianDeserializer.__init__');">-</a><tt class="py-line"> <tt class="py-keyword">def</tt> <a class="py-def-name" href="pyspark.serializers.CartesianDeserializer-class.html#__init__">__init__</a><tt class="py-op">(</tt><tt class="py-param">self</tt><tt class="py-op">,</tt> <tt class="py-param">key_ser</tt><tt class="py-op">,</tt> <tt class="py-param">val_ser</tt><tt class="py-op">)</tt><tt class="py-op">:</tt> </tt>
+</div><div id="CartesianDeserializer.__init__-collapsed" style="display:none;" pad="+++" indent="++++++++"></div><div id="CartesianDeserializer.__init__-expanded"><a name="L213"></a><tt class="py-lineno">213</tt> <tt class="py-line"> <tt class="py-name">self</tt><tt class="py-op">.</tt><tt class="py-name">key_ser</tt> <tt class="py-op">=</tt> <tt class="py-name">key_ser</tt> </tt>
+<a name="L214"></a><tt class="py-lineno">214</tt> <tt class="py-line"> <tt class="py-name">self</tt><tt class="py-op">.</tt><tt class="py-name">val_ser</tt> <tt class="py-op">=</tt> <tt class="py-name">val_ser</tt> </tt>
+</div><a name="L215"></a><tt class="py-lineno">215</tt> <tt class="py-line"> </tt>
+<a name="CartesianDeserializer.prepare_keys_values"></a><div id="CartesianDeserializer.prepare_keys_values-def"><a name="L216"></a><tt class="py-lineno">216</tt> <a class="py-toggle" href="#" id="CartesianDeserializer.prepare_keys_values-toggle" onclick="return toggle('CartesianDeserializer.prepare_keys_values');">-</a><tt class="py-line"> <tt class="py-keyword">def</tt> <a class="py-def-name" href="pyspark.serializers.CartesianDeserializer-class.html#prepare_keys_values">prepare_keys_values</a><tt class="py-op">(</tt><tt class="py-param">self</tt><tt class="py-op">,</tt> <tt class="py-param">stream</tt><tt class="py-op">)</tt><tt class="py-op">:</tt> </tt>
+</div><div id="CartesianDeserializer.prepare_keys_values-collapsed" style="display:none;" pad="+++" indent="++++++++"></div><div id="CartesianDeserializer.prepare_keys_values-expanded"><a name="L217"></a><tt class="py-lineno">217</tt> <tt class="py-line"> <tt class="py-name">key_stream</tt> <tt class="py-op">=</tt> <tt class="py-name">self</tt><tt class="py-op">.</tt><tt class="py-name">key_ser</tt><tt class="py-op">.</tt><tt class="py-name">_load_stream_without_unbatching</tt><tt class="py-op">(</tt><tt class="py-name">stream</tt><tt class="py-op">)</tt> </tt>
+<a name="L218"></a><tt class="py-lineno">218</tt> <tt class="py-line"> <tt class="py-name">val_stream</tt> <tt class="py-op">=</tt> <tt class="py-name">self</tt><tt class="py-op">.</tt><tt class="py-name">val_ser</tt><tt class="py-op">.</tt><tt class="py-name">_load_stream_without_unbatching</tt><tt class="py-op">(</tt><tt class="py-name">stream</tt><tt class="py-op">)</tt> </tt>
+<a name="L219"></a><tt class="py-lineno">219</tt> <tt class="py-line"> <tt class="py-name">key_is_batched</tt> <tt class="py-op">=</tt> <tt class="py-name">isinstance</tt><tt class="py-op">(</tt><tt class="py-name">self</tt><tt class="py-op">.</tt><tt class="py-name">key_ser</tt><tt class="py-op">,</tt> <tt class="py-name">BatchedSerializer</tt><tt class="py-op">)</tt> </tt>
+<a name="L220"></a><tt class="py-lineno">220</tt> <tt class="py-line"> <tt class="py-name">val_is_batched</tt> <tt class="py-op">=</tt> <tt class="py-name">isinstance</tt><tt class="py-op">(</tt><tt class="py-name">self</tt><tt class="py-op">.</tt><tt class="py-name">val_ser</tt><tt class="py-op">,</tt> <tt class="py-name">BatchedSerializer</tt><tt class="py-op">)</tt> </tt>
+<a name="L221"></a><tt class="py-lineno">221</tt> <tt class="py-line"> <tt class="py-keyword">for</tt> <tt class="py-op">(</tt><tt id="link-8" class="py-name" targets="Method pyspark.rdd.RDD.keys()=pyspark.rdd.RDD-class.html#keys"><a title="pyspark.rdd.RDD.keys" class="py-name" href="#" onclick="return doclink('link-8', 'keys', 'link-8');">keys</a></tt><tt class="py-op">,</tt> <tt class="py-name">vals</tt><tt class="py-op">)</tt> <tt class="py-keyword">in</tt> <tt class="py-name">izip</tt><tt class="py-op">(</tt><tt class="py-name">key_stream</tt><tt class="py-op">,</tt> <tt class="py-name">val_stream</tt><tt class="py-op">)</tt><tt class="py-op">:</tt> </tt>
+<a name="L222"></a><tt class="py-lineno">222</tt> <tt class="py-line"> <tt id="link-9" class="py-name"><a title="pyspark.rdd.RDD.keys" class="py-name" href="#" onclick="return doclink('link-9', 'keys', 'link-8');">keys</a></tt> <tt class="py-op">=</tt> <tt id="link-10" class="py-name"><a title="pyspark.rdd.RDD.keys" class="py-name" href="#" onclick="return doclink('link-10', 'keys', 'link-8');">keys</a></tt> <tt class="py-keyword">if</tt> <tt class="py-name">key_is_batched</tt> <tt class="py-keyword">else</tt> <tt class="py-op">[</tt><tt id="link-11" class="py-name"><a title="pyspark.rdd.RDD.keys" class="py-name" href="#" onclick="return doclink('link-11', 'keys', 'link-8');">keys</a></tt><tt class="py-op">]</tt> </tt>
+<a name="L223"></a><tt class="py-lineno">223</tt> <tt class="py-line"> <tt class="py-name">vals</tt> <tt class="py-op">=</tt> <tt class="py-name">vals</tt> <tt class="py-keyword">if</tt> <tt class="py-name">val_is_batched</tt> <tt class="py-keyword">else</tt> <tt class="py-op">[</tt><tt class="py-name">vals</tt><tt class="py-op">]</tt> </tt>
+<a name="L224"></a><tt class="py-lineno">224</tt> <tt class="py-line"> <tt class="py-keyword">yield</tt> <tt class="py-op">(</tt><tt id="link-12" class="py-name"><a title="pyspark.rdd.RDD.keys" class="py-name" href="#" onclick="return doclink('link-12', 'keys', 'link-8');">keys</a></tt><tt class="py-op">,</tt> <tt class="py-name">vals</tt><tt class="py-op">)</tt> </tt>
+</div><a name="L225"></a><tt class="py-lineno">225</tt> <tt class="py-line"> </tt>
+<a name="CartesianDeserializer.load_stream"></a><div id="CartesianDeserializer.load_stream-def"><a name="L226"></a><tt class="py-lineno">226</tt> <a class="py-toggle" href="#" id="CartesianDeserializer.load_stream-toggle" onclick="return toggle('CartesianDeserializer.load_stream');">-</a><tt class="py-line"> <tt class="py-keyword">def</tt> <a class="py-def-name" href="pyspark.serializers.CartesianDeserializer-class.html#load_stream">load_stream</a><tt class="py-op">(</tt><tt class="py-param">self</tt><tt class="py-op">,</tt> <tt class="py-param">stream</tt><tt class="py-op">)</tt><tt class="py-op">:</tt> </tt>
+</div><div id="CartesianDeserializer.load_stream-collapsed" style="display:none;" pad="+++" indent="++++++++"></div><div id="CartesianDeserializer.load_stream-expanded"><a name="L227"></a><tt class="py-lineno">227</tt> <tt class="py-line"> <tt class="py-keyword">for</tt> <tt class="py-op">(</tt><tt id="link-13" class="py-name"><a title="pyspark.rdd.RDD.keys" class="py-name" href="#" onclick="return doclink('link-13', 'keys', 'link-8');">keys</a></tt><tt class="py-op">,</tt> <tt class="py-name">vals</tt><tt class="py-op">)</tt> <tt class="py-keyword">in</tt> <tt class="py-name">self</tt><tt class="py-op">.</tt><tt class="py-name">prepare_keys_values</tt><tt class="py-op">(</tt><tt class="py-name">stream</tt><tt class="py-op">)</tt><tt class="py-op">:</tt> </tt>
+<a name="L228"></a><tt class="py-lineno">228</tt> <tt class="py-line"> <tt class="py-keyword">for</tt> <tt class="py-name">pair</tt> <tt class="py-keyword">in</tt> <tt class="py-name">product</tt><tt class="py-op">(</tt><tt id="link-14" class="py-name"><a title="pyspark.rdd.RDD.keys" class="py-name" href="#" onclick="return doclink('link-14', 'keys', 'link-8');">keys</a></tt><tt class="py-op">,</tt> <tt class="py-name">vals</tt><tt class="py-op">)</tt><tt class="py-op">:</tt> </tt>
+<a name="L229"></a><tt class="py-lineno">229</tt> <tt class="py-line"> <tt class="py-keyword">yield</tt> <tt class="py-name">pair</tt> </tt>
+</div><a name="L230"></a><tt class="py-lineno">230</tt> <tt class="py-line"> </tt>
+<a name="CartesianDeserializer.__eq__"></a><div id="CartesianDeserializer.__eq__-def"><a name="L231"></a><tt class="py-lineno">231</tt> <a class="py-toggle" href="#" id="CartesianDeserializer.__eq__-toggle" onclick="return toggle('CartesianDeserializer.__eq__');">-</a><tt class="py-line"> <tt class="py-keyword">def</tt> <a class="py-def-name" href="pyspark.serializers.CartesianDeserializer-class.html#__eq__">__eq__</a><tt class="py-op">(</tt><tt class="py-param">self</tt><tt class="py-op">,</tt> <tt class="py-param">other</tt><tt class="py-op">)</tt><tt class="py-op">:</tt> </tt>
+</div><div id="CartesianDeserializer.__eq__-collapsed" style="display:none;" pad="+++" indent="++++++++"></div><div id="CartesianDeserializer.__eq__-expanded"><a name="L232"></a><tt class="py-lineno">232</tt> <tt class="py-line"> <tt class="py-keyword">return</tt> <tt class="py-name">isinstance</tt><tt class="py-op">(</tt><tt class="py-name">other</tt><tt class="py-op">,</tt> <tt class="py-name">CartesianDeserializer</tt><tt class="py-op">)</tt> <tt class="py-keyword">and</tt> \ </tt>
+<a name="L233"></a><tt class="py-lineno">233</tt> <tt class="py-line"> <tt class="py-name">self</tt><tt class="py-op">.</tt><tt class="py-name">key_ser</tt> <tt class="py-op">==</tt> <tt class="py-name">other</tt><tt class="py-op">.</tt><tt class="py-name">key_ser</tt> <tt class="py-keyword">and</tt> <tt class="py-name">self</tt><tt class="py-op">.</tt><tt class="py-name">val_ser</tt> <tt class="py-op">==</tt> <tt class="py-name">other</tt><tt class="py-op">.</tt><tt class="py-name">val_ser</tt> </tt>
+</div><a name="L234"></a><tt class="py-lineno">234</tt> <tt class="py-line"> </tt>
+<a name="CartesianDeserializer.__str__"></a><div id="CartesianDeserializer.__str__-def"><a name="L235"></a><tt class="py-lineno">235</tt> <a class="py-toggle" href="#" id="CartesianDeserializer.__str__-toggle" onclick="return toggle('CartesianDeserializer.__str__');">-</a><tt class="py-line"> <tt class="py-keyword">def</tt> <a class="py-def-name" href="pyspark.serializers.CartesianDeserializer-class.html#__str__">__str__</a><tt class="py-op">(</tt><tt class="py-param">self</tt><tt class="py-op">)</tt><tt class="py-op">:</tt> </tt>
+</div><div id="CartesianDeserializer.__str__-collapsed" style="display:none;" pad="+++" indent="++++++++"></div><div id="CartesianDeserializer.__str__-expanded"><a name="L236"></a><tt class="py-lineno">236</tt> <tt class="py-line"> <tt class="py-keyword">return</tt> <tt class="py-string">"CartesianDeserializer&lt;%s, %s&gt;"</tt> <tt class="py-op">%</tt> \ </tt>
+<a name="L237"></a><tt class="py-lineno">237</tt> <tt class="py-line"> <tt class="py-op">(</tt><tt class="py-name">str</tt><tt class="py-op">(</tt><tt class="py-name">self</tt><tt class="py-op">.</tt><tt class="py-name">key_ser</tt><tt class="py-op">)</tt><tt class="py-op">,</tt> <tt class="py-name">str</tt><tt class="py-op">(</tt><tt class="py-name">self</tt><tt class="py-op">.</tt><tt class="py-name">val_ser</tt><tt class="py-op">)</tt><tt class="py-op">)</tt> </tt>
+</div></div><a name="L238"></a><tt class="py-lineno">238</tt> <tt class="py-line"> </tt>
+<a name="L239"></a><tt class="py-lineno">239</tt> <tt class="py-line"> </tt>
+<a name="PairDeserializer"></a><div id="PairDeserializer-def"><a name="L240"></a><tt class="py-lineno">240</tt> <a class="py-toggle" href="#" id="PairDeserializer-toggle" onclick="return toggle('PairDeserializer');">-</a><tt class="py-line"><tt class="py-keyword">class</tt> <a class="py-def-name" href="pyspark.serializers.PairDeserializer-class.html">PairDeserializer</a><tt class="py-op">(</tt><tt class="py-base-class">CartesianDeserializer</tt><tt class="py-op">)</tt><tt class="py-op">:</tt> </tt>
+</div><div id="PairDeserializer-collapsed" style="display:none;" pad="+++" indent="++++"></div><div id="PairDeserializer-expanded"><a name="L241"></a><tt class="py-lineno">241</tt> <tt class="py-line"> <tt class="py-docstring">"""</tt> </tt>
+<a name="L242"></a><tt class="py-lineno">242</tt> <tt class="py-line"><tt class="py-docstring"> Deserializes the JavaRDD zip() of two PythonRDDs.</tt> </tt>
+<a name="L243"></a><tt class="py-lineno">243</tt> <tt class="py-line"><tt class="py-docstring"> """</tt> </tt>
+<a name="L244"></a><tt class="py-lineno">244</tt> <tt class="py-line"> </tt>
+<a name="PairDeserializer.__init__"></a><div id="PairDeserializer.__init__-def"><a name="L245"></a><tt class="py-lineno">245</tt> <a class="py-toggle" href="#" id="PairDeserializer.__init__-toggle" onclick="return toggle('PairDeserializer.__init__');">-</a><tt class="py-line"> <tt class="py-keyword">def</tt> <a class="py-def-name" href="pyspark.serializers.PairDeserializer-class.html#__init__">__init__</a><tt class="py-op">(</tt><tt class="py-param">self</tt><tt class="py-op">,</tt> <tt class="py-param">key_ser</tt><tt class="py-op">,</tt> <tt class="py-param">val_ser</tt><tt class="py-op">)</tt><tt class="py-op">:</tt> </tt>
+</div><div id="PairDeserializer.__init__-collapsed" style="display:none;" pad="+++" indent="++++++++"></div><div id="PairDeserializer.__init__-expanded"><a name="L246"></a><tt class="py-lineno">246</tt> <tt class="py-line"> <tt class="py-name">self</tt><tt class="py-op">.</tt><tt class="py-name">key_ser</tt> <tt class="py-op">=</tt> <tt class="py-name">key_ser</tt> </tt>
+<a name="L247"></a><tt class="py-lineno">247</tt> <tt class="py-line"> <tt class="py-name">self</tt><tt class="py-op">.</tt><tt class="py-name">val_ser</tt> <tt class="py-op">=</tt> <tt class="py-name">val_ser</tt> </tt>
+</div><a name="L248"></a><tt class="py-lineno">248</tt> <tt class="py-line"> </tt>
+<a name="PairDeserializer.load_stream"></a><div id="PairDeserializer.load_stream-def"><a name="L249"></a><tt class="py-lineno">249</tt> <a class="py-toggle" href="#" id="PairDeserializer.load_stream-toggle" onclick="return toggle('PairDeserializer.load_stream');">-</a><tt class="py-line"> <tt class="py-keyword">def</tt> <a class="py-def-name" href="pyspark.serializers.PairDeserializer-class.html#load_stream">load_stream</a><tt class="py-op">(</tt><tt class="py-param">self</tt><tt class="py-op">,</tt> <tt class="py-param">stream</tt><tt class="py-op">)</tt><tt class="py-op">:</tt> </tt>
+</div><div id="PairDeserializer.load_stream-collapsed" style="display:none;" pad="+++" indent="++++++++"></div><div id="PairDeserializer.load_stream-expanded"><a name="L250"></a><tt class="py-lineno">250</tt> <tt class="py-line"> <tt class="py-keyword">for</tt> <tt class="py-op">(</tt><tt id="link-15" class="py-name"><a title="pyspark.rdd.RDD.keys" class="py-name" href="#" onclick="return doclink('link-15', 'keys', 'link-8');">keys</a></tt><tt class="py-op">,</tt> <tt class="py-name">vals</tt><tt class="py-op">)</tt> <tt class="py-keyword">in</tt> <tt class="py-name">self</tt><tt class="py-op">.</tt><tt class="py-name">prepare_keys_values</tt><tt class="py-op">(</tt><tt class="py-name">stream</tt><tt class="py-op">)</tt><tt class="py-op">:</tt> </tt>
+<a name="L251"></a><tt class="py-lineno">251</tt> <tt class="py-line"> <tt class="py-keyword">for</tt> <tt class="py-name">pair</tt> <tt class="py-keyword">in</tt> <tt class="py-name">izip</tt><tt class="py-op">(</tt><tt id="link-16" class="py-name"><a title="pyspark.rdd.RDD.keys" class="py-name" href="#" onclick="return doclink('link-16', 'keys', 'link-8');">keys</a></tt><tt class="py-op">,</tt> <tt class="py-name">vals</tt><tt class="py-op">)</tt><tt class="py-op">:</tt> </tt>
+<a name="L252"></a><tt class="py-lineno">252</tt> <tt class="py-line"> <tt class="py-keyword">yield</tt> <tt class="py-name">pair</tt> </tt>
+</div><a name="L253"></a><tt class="py-lineno">253</tt> <tt class="py-line"> </tt>
+<a name="PairDeserializer.__eq__"></a><div id="PairDeserializer.__eq__-def"><a name="L254"></a><tt class="py-lineno">254</tt> <a class="py-toggle" href="#" id="PairDeserializer.__eq__-toggle" onclick="return toggle('PairDeserializer.__eq__');">-</a><tt class="py-line"> <tt class="py-keyword">def</tt> <a class="py-def-name" href="pyspark.serializers.PairDeserializer-class.html#__eq__">__eq__</a><tt class="py-op">(</tt><tt class="py-param">self</tt><tt class="py-op">,</tt> <tt class="py-param">other</tt><tt class="py-op">)</tt><tt class="py-op">:</tt> </tt>
+</div><div id="PairDeserializer.__eq__-collapsed" style="display:none;" pad="+++" indent="++++++++"></div><div id="PairDeserializer.__eq__-expanded"><a name="L255"></a><tt class="py-lineno">255</tt> <tt class="py-line"> <tt class="py-keyword">return</tt> <tt class="py-name">isinstance</tt><tt class="py-op">(</tt><tt class="py-name">other</tt><tt class="py-op">,</tt> <tt class="py-name">PairDeserializer</tt><tt class="py-op">)</tt> <tt class="py-keyword">and</tt> \ </tt>
+<a name="L256"></a><tt class="py-lineno">256</tt> <tt class="py-line"> <tt class="py-name">self</tt><tt class="py-op">.</tt><tt class="py-name">key_ser</tt> <tt class="py-op">==</tt> <tt class="py-name">other</tt><tt class="py-op">.</tt><tt class="py-name">key_ser</tt> <tt class="py-keyword">and</tt> <tt class="py-name">self</tt><tt class="py-op">.</tt><tt class="py-name">val_ser</tt> <tt class="py-op">==</tt> <tt class="py-name">other</tt><tt class="py-op">.</tt><tt class="py-name">val_ser</tt> </tt>
+</div><a name="L257"></a><tt class="py-lineno">257</tt> <tt class="py-line"> </tt>
+<a name="PairDeserializer.__str__"></a><div id="PairDeserializer.__str__-def"><a name="L258"></a><tt class="py-lineno">258</tt> <a class="py-toggle" href="#" id="PairDeserializer.__str__-toggle" onclick="return toggle('PairDeserializer.__str__');">-</a><tt class="py-line"> <tt class="py-keyword">def</tt> <a class="py-def-name" href="pyspark.serializers.PairDeserializer-class.html#__str__">__str__</a><tt class="py-op">(</tt><tt class="py-param">self</tt><tt class="py-op">)</tt><tt class="py-op">:</tt> </tt>
+</div><div id="PairDeserializer.__str__-collapsed" style="display:none;" pad="+++" indent="++++++++"></div><div id="PairDeserializer.__str__-expanded"><a name="L259"></a><tt class="py-lineno">259</tt> <tt class="py-line"> <tt class="py-keyword">return</tt> <tt class="py-string">"PairDeserializer&lt;%s, %s&gt;"</tt> <tt class="py-op">%</tt> \ </tt>
+<a name="L260"></a><tt class="py-lineno">260</tt> <tt class="py-line"> <tt class="py-op">(</tt><tt class="py-name">str</tt><tt class="py-op">(</tt><tt class="py-name">self</tt><tt class="py-op">.</tt><tt class="py-name">key_ser</tt><tt class="py-op">)</tt><tt class="py-op">,</tt> <tt class="py-name">str</tt><tt class="py-op">(</tt><tt class="py-name">self</tt><tt class="py-op">.</tt><tt class="py-name">val_ser</tt><tt class="py-op">)</tt><tt class="py-op">)</tt> </tt>
+</div></div><a name="L261"></a><tt class="py-lineno">261</tt> <tt class="py-line"> </tt>
+<a name="L262"></a><tt class="py-lineno">262</tt> <tt class="py-line"> </tt>
+<a name="NoOpSerializer"></a><div id="NoOpSerializer-def"><a name="L263"></a><tt class="py-lineno">263</tt> <a class="py-toggle" href="#" id="NoOpSerializer-toggle" onclick="return toggle('NoOpSerializer');">-</a><tt class="py-line"><tt class="py-keyword">class</tt> <a class="py-def-name" href="pyspark.serializers.NoOpSerializer-class.html">NoOpSerializer</a><tt class="py-op">(</tt><tt class="py-base-class">FramedSerializer</tt><tt class="py-op">)</tt><tt class="py-op">:</tt> </tt>
+</div><div id="NoOpSerializer-collapsed" style="display:none;" pad="+++" indent="++++"></div><div id="NoOpSerializer-expanded"><a name="L264"></a><tt class="py-lineno">264</tt> <tt class="py-line"> </tt>
+<a name="NoOpSerializer.loads"></a><div id="NoOpSerializer.loads-def"><a name="L265"></a><tt class="py-lineno">265</tt> <a class="py-toggle" href="#" id="NoOpSerializer.loads-toggle" onclick="return toggle('NoOpSerializer.loads');">-</a><tt class="py-line"> <tt class="py-keyword">def</tt> <a class="py-def-name" href="pyspark.serializers.NoOpSerializer-class.html#loads">loads</a><tt class="py-op">(</tt><tt class="py-param">self</tt><tt class="py-op">,</tt> <tt class="py-param">obj</tt><tt class="py-op">)</tt><tt class="py-op">:</tt> <tt class="py-keyword">return</tt> <tt class="py-name">obj</tt> </tt>
+</div><a name="NoOpSerializer.dumps"></a><div id="NoOpSerializer.dumps-def"><a name="L266"></a><tt class="py-lineno">266</tt> <a class="py-toggle" href="#" id="NoOpSerializer.dumps-toggle" onclick="return toggle('NoOpSerializer.dumps');">-</a><tt class="py-line"> <tt class="py-keyword">def</tt> <a class="py-def-name" href="pyspark.serializers.NoOpSerializer-class.html#dumps">dumps</a><tt class="py-op">(</tt><tt class="py-param">self</tt><tt class="py-op">,</tt> <tt class="py-param">obj</tt><tt class="py-op">)</tt><tt class="py-op">:</tt> <tt class="py-keyword">return</tt> <tt class="py-name">obj</tt> </tt>
+</div></div><a name="L267"></a><tt class="py-lineno">267</tt> <tt class="py-line"> </tt>
+<a name="L268"></a><tt class="py-lineno">268</tt> <tt class="py-line"> </tt>
+<a name="PickleSerializer"></a><div id="PickleSerializer-def"><a name="L269"></a><tt class="py-lineno">269</tt> <a class="py-toggle" href="#" id="PickleSerializer-toggle" onclick="return toggle('PickleSerializer');">-</a><tt class="py-line"><tt class="py-keyword">class</tt> <a class="py-def-name" href="pyspark.serializers.PickleSerializer-class.html">PickleSerializer</a><tt class="py-op">(</tt><tt class="py-base-class">FramedSerializer</tt><tt class="py-op">)</tt><tt class="py-op">:</tt> </tt>
+</div><div id="PickleSerializer-collapsed" style="display:none;" pad="+++" indent="++++"></div><div id="PickleSerializer-expanded"><a name="L270"></a><tt class="py-lineno">270</tt> <tt class="py-line"> <tt class="py-docstring">"""</tt> </tt>
+<a name="L271"></a><tt class="py-lineno">271</tt> <tt class="py-line"><tt class="py-docstring"> Serializes objects using Python's cPickle serializer:</tt> </tt>
+<a name="L272"></a><tt class="py-lineno">272</tt> <tt class="py-line"><tt class="py-docstring"></tt> </tt>
+<a name="L273"></a><tt class="py-lineno">273</tt> <tt class="py-line"><tt class="py-docstring"> http://docs.python.org/2/library/pickle.html</tt> </tt>
+<a name="L274"></a><tt class="py-lineno">274</tt> <tt class="py-line"><tt class="py-docstring"></tt> </tt>
+<a name="L275"></a><tt class="py-lineno">275</tt> <tt class="py-line"><tt class="py-docstring"> This serializer supports nearly any Python object, but may</tt> </tt>
+<a name="L276"></a><tt class="py-lineno">276</tt> <tt class="py-line"><tt class="py-docstring"> not be as fast as more specialized serializers.</tt> </tt>
+<a name="L277"></a><tt class="py-lineno">277</tt> <tt class="py-line"><tt class="py-docstring"> """</tt> </tt>
+<a name="L278"></a><tt class="py-lineno">278</tt> <tt class="py-line"> </tt>
+<a name="PickleSerializer.dumps"></a><div id="PickleSerializer.dumps-def"><a name="L279"></a><tt class="py-lineno">279</tt> <a class="py-toggle" href="#" id="PickleSerializer.dumps-toggle" onclick="return toggle('PickleSerializer.dumps');">-</a><tt class="py-line"> <tt class="py-keyword">def</tt> <a class="py-def-name" href="pyspark.serializers.PickleSerializer-class.html#dumps">dumps</a><tt class="py-op">(</tt><tt class="py-param">self</tt><tt class="py-op">,</tt> <tt class="py-param">obj</tt><tt class="py-op">)</tt><tt class="py-op">:</tt> <tt class="py-keyword">return</tt> <tt class="py-name">cPickle</tt><tt class="py-op">.</tt><tt id="link-17" class="py-name"><a title="pyspark.serializers.MarshalSerializer.dumps
+pyspark.serializers.PickleSerializer.dumps" class="py-name" href="#" onclick="return doclink('link-17', 'dumps', 'link-2');">dumps</a></tt><tt class="py-op">(</tt><tt class="py-name">obj</tt><tt class="py-op">,</tt> <tt class="py-number">2</tt><tt class="py-op">)</tt> </tt>
+</div><a name="L280"></a><tt class="py-lineno">280</tt> <tt class="py-line"> <tt id="link-18" class="py-name"><a title="pyspark.serializers.MarshalSerializer.loads
+pyspark.serializers.PickleSerializer.loads" class="py-name" href="#" onclick="return doclink('link-18', 'loads', 'link-3');">loads</a></tt> <tt class="py-op">=</tt> <tt class="py-name">cPickle</tt><tt class="py-op">.</tt><tt id="link-19" class="py-name"><a title="pyspark.serializers.MarshalSerializer.loads
+pyspark.serializers.PickleSerializer.loads" class="py-name" href="#" onclick="return doclink('link-19', 'loads', 'link-3');">loads</a></tt> </tt>
+</div><a name="L281"></a><tt class="py-lineno">281</tt> <tt class="py-line"> </tt>
+<a name="CloudPickleSerializer"></a><div id="CloudPickleSerializer-def"><a name="L282"></a><tt class="py-lineno">282</tt> <a class="py-toggle" href="#" id="CloudPickleSerializer-toggle" onclick="return toggle('CloudPickleSerializer');">-</a><tt class="py-line"><tt class="py-keyword">class</tt> <a class="py-def-name" href="pyspark.serializers.CloudPickleSerializer-class.html">CloudPickleSerializer</a><tt class="py-op">(</tt><tt class="py-base-class">PickleSerializer</tt><tt class="py-op">)</tt><tt class="py-op">:</tt> </tt>
+</div><div id="CloudPickleSerializer-collapsed" style="display:none;" pad="+++" indent="++++"></div><div id="CloudPickleSerializer-expanded"><a name="L283"></a><tt class="py-lineno">283</tt> <tt class="py-line"> </tt>
+<a name="CloudPickleSerializer.dumps"></a><div id="CloudPickleSerializer.dumps-def"><a name="L284"></a><tt class="py-lineno">284</tt> <a class="py-toggle" href="#" id="CloudPickleSerializer.dumps-toggle" onclick="return toggle('CloudPickleSerializer.dumps');">-</a><tt class="py-line"> <tt class="py-keyword">def</tt> <a class="py-def-name" href="pyspark.serializers.CloudPickleSerializer-class.html#dumps">dumps</a><tt class="py-op">(</tt><tt class="py-param">self</tt><tt class="py-op">,</tt> <tt class="py-param">obj</tt><tt class="py-op">)</tt><tt class="py-op">:</tt> <tt class="py-keyword">return</tt> <tt class="py-name">cloudpickle</tt><tt class="py-op">.</tt><tt id="link-20" class="py-name"><a title="pyspark.serializers.MarshalSerializer.dumps
+pyspark.serializers.PickleSerializer.dumps" class="py-name" href="#" onclick="return doclink('link-20', 'dumps', 'link-2');">dumps</a></tt><tt class="py-op">(</tt><tt class="py-name">obj</tt><tt class="py-op">,</tt> <tt class="py-number">2</tt><tt class="py-op">)</tt> </tt>
+</div></div><a name="L285"></a><tt class="py-lineno">285</tt> <tt class="py-line"> </tt>
+<a name="L286"></a><tt class="py-lineno">286</tt> <tt class="py-line"> </tt>
+<a name="MarshalSerializer"></a><div id="MarshalSerializer-def"><a name="L287"></a><tt class="py-lineno">287</tt> <a class="py-toggle" href="#" id="MarshalSerializer-toggle" onclick="return toggle('MarshalSerializer');">-</a><tt class="py-line"><tt class="py-keyword">class</tt> <a class="py-def-name" href="pyspark.serializers.MarshalSerializer-class.html">MarshalSerializer</a><tt class="py-op">(</tt><tt class="py-base-class">FramedSerializer</tt><tt class="py-op">)</tt><tt class="py-op">:</tt> </tt>
+</div><div id="MarshalSerializer-collapsed" style="display:none;" pad="+++" indent="++++"></div><div id="MarshalSerializer-expanded"><a name="L288"></a><tt class="py-lineno">288</tt> <tt class="py-line"> <tt class="py-docstring">"""</tt> </tt>
+<a name="L289"></a><tt class="py-lineno">289</tt> <tt class="py-line"><tt class="py-docstring"> Serializes objects using Python's Marshal serializer:</tt> </tt>
+<a name="L290"></a><tt class="py-lineno">290</tt> <tt class="py-line"><tt class="py-docstring"></tt> </tt>
+<a name="L291"></a><tt class="py-lineno">291</tt> <tt class="py-line"><tt class="py-docstring"> http://docs.python.org/2/library/marshal.html</tt> </tt>
+<a name="L292"></a><tt class="py-lineno">292</tt> <tt class="py-line"><tt class="py-docstring"></tt> </tt>
+<a name="L293"></a><tt class="py-lineno">293</tt> <tt class="py-line"><tt class="py-docstring"> This serializer is faster than PickleSerializer but supports fewer datatypes.</tt> </tt>
+<a name="L294"></a><tt class="py-lineno">294</tt> <tt class="py-line"><tt class="py-docstring"> """</tt> </tt>
+<a name="L295"></a><tt class="py-lineno">295</tt> <tt class="py-line"> </tt>
+<a name="L296"></a><tt class="py-lineno">296</tt> <tt class="py-line"> <tt id="link-21" class="py-name"><a title="pyspark.serializers.MarshalSerializer.dumps
+pyspark.serializers.PickleSerializer.dumps" class="py-name" href="#" onclick="return doclink('link-21', 'dumps', 'link-2');">dumps</a></tt> <tt class="py-op">=</tt> <tt class="py-name">marshal</tt><tt class="py-op">.</tt><tt id="link-22" class="py-name"><a title="pyspark.serializers.MarshalSerializer.dumps
+pyspark.serializers.PickleSerializer.dumps" class="py-name" href="#" onclick="return doclink('link-22', 'dumps', 'link-2');">dumps</a></tt> </tt>
+<a name="L297"></a><tt class="py-lineno">297</tt> <tt class="py-line"> <tt id="link-23" class="py-name"><a title="pyspark.serializers.MarshalSerializer.loads
+pyspark.serializers.PickleSerializer.loads" class="py-name" href="#" onclick="return doclink('link-23', 'loads', 'link-3');">loads</a></tt> <tt class="py-op">=</tt> <tt class="py-name">marshal</tt><tt class="py-op">.</tt><tt id="link-24" class="py-name"><a title="pyspark.serializers.MarshalSerializer.loads
+pyspark.serializers.PickleSerializer.loads" class="py-name" href="#" onclick="return doclink('link-24', 'loads', 'link-3');">loads</a></tt> </tt>
+</div><a name="L298"></a><tt class="py-lineno">298</tt> <tt class="py-line"> </tt>
+<a name="L299"></a><tt class="py-lineno">299</tt> <tt class="py-line"> </tt>
+<a name="UTF8Deserializer"></a><div id="UTF8Deserializer-def"><a name="L300"></a><tt class="py-lineno">300</tt> <a class="py-toggle" href="#" id="UTF8Deserializer-toggle" onclick="return toggle('UTF8Deserializer');">-</a><tt class="py-line"><tt class="py-keyword">class</tt> <a class="py-def-name" href="pyspark.serializers.UTF8Deserializer-class.html">UTF8Deserializer</a><tt class="py-op">(</tt><tt class="py-base-class">Serializer</tt><tt class="py-op">)</tt><tt class="py-op">:</tt> </tt>
+</div><div id="UTF8Deserializer-collapsed" style="display:none;" pad="+++" indent="++++"></div><div id="UTF8Deserializer-expanded"><a name="L301"></a><tt class="py-lineno">301</tt> <tt class="py-line"> <tt class="py-docstring">"""</tt> </tt>
+<a name="L302"></a><tt class="py-lineno">302</tt> <tt class="py-line"><tt class="py-docstring"> Deserializes streams written by String.getBytes.</tt> </tt>
+<a name="L303"></a><tt class="py-lineno">303</tt> <tt class="py-line"><tt class="py-docstring"> """</tt> </tt>
+<a name="L304"></a><tt class="py-lineno">304</tt> <tt class="py-line"> </tt>
+<a name="UTF8Deserializer.loads"></a><div id="UTF8Deserializer.loads-def"><a name="L305"></a><tt class="py-lineno">305</tt> <a class="py-toggle" href="#" id="UTF8Deserializer.loads-toggle" onclick="return toggle('UTF8Deserializer.loads');">-</a><tt class="py-line"> <tt class="py-keyword">def</tt> <a class="py-def-name" href="pyspark.serializers.UTF8Deserializer-class.html#loads">loads</a><tt class="py-op">(</tt><tt class="py-param">self</tt><tt class="py-op">,</tt> <tt class="py-param">stream</tt><tt class="py-op">)</tt><tt class="py-op">:</tt> </tt>
+</div><div id="UTF8Deserializer.loads-collapsed" style="display:none;" pad="+++" indent="++++++++"></div><div id="UTF8Deserializer.loads-expanded"><a name="L306"></a><tt class="py-lineno">306</tt> <tt class="py-line"> <tt class="py-name">length</tt> <tt class="py-op">=</tt> <tt class="py-name">read_int</tt><tt class="py-op">(</tt><tt class="py-name">stream</tt><tt class="py-op">)</tt> </tt>
+<a name="L307"></a><tt class="py-lineno">307</tt> <tt class="py-line"> <tt class="py-keyword">return</tt> <tt class="py-name">stream</tt><tt class="py-op">.</tt><tt class="py-name">read</tt><tt class="py-op">(</tt><tt class="py-name">length</tt><tt class="py-op">)</tt><tt class="py-op">.</tt><tt class="py-name">decode</tt><tt class="py-op">(</tt><tt class="py-string">'utf8'</tt><tt class="py-op">)</tt> </tt>
+</div><a name="L308"></a><tt class="py-lineno">308</tt> <tt class="py-line"> </tt>
+<a name="UTF8Deserializer.load_stream"></a><div id="UTF8Deserializer.load_stream-def"><a name="L309"></a><tt class="py-lineno">309</tt> <a class="py-toggle" href="#" id="UTF8Deserializer.load_stream-toggle" onclick="return toggle('UTF8Deserializer.load_stream');">-</a><tt class="py-line"> <tt class="py-keyword">def</tt> <a class="py-def-name" href="pyspark.serializers.UTF8Deserializer-class.html#load_stream">load_stream</a><tt class="py-op">(</tt><tt class="py-param">self</tt><tt class="py-op">,</tt> <tt class="py-param">stream</tt><tt class="py-op">)</tt><tt class="py-op">:</tt> </tt>
+</div><div id="UTF8Deserializer.load_stream-collapsed" style="display:none;" pad="+++" indent="++++++++"></div><div id="UTF8Deserializer.load_stream-expanded"><a name="L310"></a><tt class="py-lineno">310</tt> <tt class="py-line"> <tt class="py-keyword">while</tt> <tt class="py-name">True</tt><tt class="py-op">:</tt> </tt>
+<a name="L311"></a><tt class="py-lineno">311</tt> <tt class="py-line"> <tt class="py-keyword">try</tt><tt class="py-op">:</tt> </tt>
+<a name="L312"></a><tt class="py-lineno">312</tt> <tt class="py-line"> <tt class="py-keyword">yield</tt> <tt class="py-name">self</tt><tt class="py-op">.</tt><tt id="link-25" class="py-name"><a title="pyspark.serializers.MarshalSerializer.loads
+pyspark.serializers.PickleSerializer.loads" class="py-name" href="#" onclick="return doclink('link-25', 'loads', 'link-3');">loads</a></tt><tt class="py-op">(</tt><tt class="py-name">stream</tt><tt class="py-op">)</tt> </tt>
+<a name="L313"></a><tt class="py-lineno">313</tt> <tt class="py-line"> <tt class="py-keyword">except</tt> <tt class="py-name">struct</tt><tt class="py-op">.</tt><tt class="py-name">error</tt><tt class="py-op">:</tt> </tt>
+<a name="L314"></a><tt class="py-lineno">314</tt> <tt class="py-line"> <tt class="py-keyword">return</tt> </tt>
+<a name="L315"></a><tt class="py-lineno">315</tt> <tt class="py-line"> <tt class="py-keyword">except</tt> <tt class="py-name">EOFError</tt><tt class="py-op">:</tt> </tt>
+<a name="L316"></a><tt class="py-lineno">316</tt> <tt class="py-line"> <tt class="py-keyword">return</tt> </tt>
+</div></div><a name="L317"></a><tt class="py-lineno">317</tt> <tt class="py-line"> </tt>
+<a name="L318"></a><tt class="py-lineno">318</tt> <tt class="py-line"> </tt>
+<a name="read_long"></a><div id="read_long-def"><a name="L319"></a><tt class="py-lineno">319</tt> <a class="py-toggle" href="#" id="read_long-toggle" onclick="return toggle('read_long');">-</a><tt class="py-line"><tt class="py-keyword">def</tt> <a class="py-def-name" href="pyspark.serializers-module.html#read_long">read_long</a><tt class="py-op">(</tt><tt class="py-param">stream</tt><tt class="py-op">)</tt><tt class="py-op">:</tt> </tt>
+</div><div id="read_long-collapsed" style="display:none;" pad="+++" indent="++++"></div><div id="read_long-expanded"><a name="L320"></a><tt class="py-lineno">320</tt> <tt class="py-line"> <tt class="py-name">length</tt> <tt class="py-op">=</tt> <tt class="py-name">stream</tt><tt class="py-op">.</tt><tt class="py-name">read</tt><tt class="py-op">(</tt><tt class="py-number">8</tt><tt class="py-op">)</tt> </tt>
+<a name="L321"></a><tt class="py-lineno">321</tt> <tt class="py-line"> <tt class="py-keyword">if</tt> <tt class="py-name">length</tt> <tt class="py-op">==</tt> <tt class="py-string">""</tt><tt class="py-op">:</tt> </tt>
+<a name="L322"></a><tt class="py-lineno">322</tt> <tt class="py-line"> <tt class="py-keyword">raise</tt> <tt class="py-name">EOFError</tt> </tt>
+<a name="L323"></a><tt class="py-lineno">323</tt> <tt class="py-line"> <tt class="py-keyword">return</tt> <tt class="py-name">struct</tt><tt class="py-op">.</tt><tt class="py-name">unpack</tt><tt class="py-op">(</tt><tt class="py-string">"!q"</tt><tt class="py-op">,</tt> <tt class="py-name">length</tt><tt class="py-op">)</tt><tt class="py-op">[</tt><tt class="py-number">0</tt><tt class="py-op">]</tt> </tt>
+</div><a name="L324"></a><tt class="py-lineno">324</tt> <tt class="py-line"> </tt>
+<a name="L325"></a><tt class="py-lineno">325</tt> <tt class="py-line"> </tt>
+<a name="write_long"></a><div id="write_long-def"><a name="L326"></a><tt class="py-lineno">326</tt> <a class="py-toggle" href="#" id="write_long-toggle" onclick="return toggle('write_long');">-</a><tt class="py-line"><tt class="py-keyword">def</tt> <a class="py-def-name" href="pyspark.serializers-module.html#write_long">write_long</a><tt class="py-op">(</tt><tt class="py-param">value</tt><tt class="py-op">,</tt> <tt class="py-param">stream</tt><tt class="py-op">)</tt><tt class="py-op">:</tt> </tt>
+</div><div id="write_long-collapsed" style="display:none;" pad="+++" indent="++++"></div><div id="write_long-expanded"><a name="L327"></a><tt class="py-lineno">327</tt> <tt class="py-line"> <tt class="py-name">stream</tt><tt class="py-op">.</tt><tt class="py-name">write</tt><tt class="py-op">(</tt><tt class="py-name">struct</tt><tt class="py-op">.</tt><tt class="py-name">pack</tt><tt class="py-op">(</tt><tt class="py-string">"!q"</tt><tt class="py-op">,</tt> <tt id="link-26" class="py-name" targets="Method pyspark.accumulators.Accumulator.value()=pyspark.accumulators.Accumulator-class.html#value"><a title="pyspark.accumulators.Accumulator.value" class="py-name" href="#" onclick="return doclink('link-26', 'value', 'link-26');">value</a></tt><tt class="py-op">)</tt><tt class="py-op">)</tt> </tt>
+</div><a name="L328"></a><tt class="py-lineno">328</tt> <tt class="py-line"> </tt>
+<a name="L329"></a><tt class="py-lineno">329</tt> <tt class="py-line"> </tt>
+<a name="pack_long"></a><div id="pack_long-def"><a name="L330"></a><tt class="py-lineno">330</tt> <a class="py-toggle" href="#" id="pack_long-toggle" onclick="return toggle('pack_long');">-</a><tt class="py-line"><tt class="py-keyword">def</tt> <a class="py-def-name" href="pyspark.serializers-module.html#pack_long">pack_long</a><tt class="py-op">(</tt><tt class="py-param">value</tt><tt class="py-op">)</tt><tt class="py-op">:</tt> </tt>
+</div><div id="pack_long-collapsed" style="display:none;" pad="+++" indent="++++"></div><div id="pack_long-expanded"><a name="L331"></a><tt class="py-lineno">331</tt> <tt class="py-line"> <tt class="py-keyword">return</tt> <tt class="py-name">struct</tt><tt class="py-op">.</tt><tt class="py-name">pack</tt><tt class="py-op">(</tt><tt class="py-string">"!q"</tt><tt class="py-op">,</tt> <tt id="link-27" class="py-name"><a title="pyspark.accumulators.Accumulator.value" class="py-name" href="#" onclick="return doclink('link-27', 'value', 'link-26');">value</a></tt><tt class="py-op">)</tt> </tt>
+</div><a name="L332"></a><tt class="py-lineno">332</tt> <tt class="py-line"> </tt>
+<a name="L333"></a><tt class="py-lineno">333</tt> <tt class="py-line"> </tt>
+<a name="read_int"></a><div id="read_int-def"><a name="L334"></a><tt class="py-lineno">334</tt> <a class="py-toggle" href="#" id="read_int-toggle" onclick="return toggle('read_int');">-</a><tt class="py-line"><tt class="py-keyword">def</tt> <a class="py-def-name" href="pyspark.serializers-module.html#read_int">read_int</a><tt class="py-op">(</tt><tt class="py-param">stream</tt><tt class="py-op">)</tt><tt class="py-op">:</tt> </tt>
+</div><div id="read_int-collapsed" style="display:none;" pad="+++" indent="++++"></div><div id="read_int-expanded"><a name="L335"></a><tt class="py-lineno">335</tt> <tt class="py-line"> <tt class="py-name">length</tt> <tt class="py-op">=</tt> <tt class="py-name">stream</tt><tt class="py-op">.</tt><tt class="py-name">read</tt><tt class="py-op">(</tt><tt class="py-number">4</tt><tt class="py-op">)</tt> </tt>
+<a name="L336"></a><tt class="py-lineno">336</tt> <tt class="py-line"> <tt class="py-keyword">if</tt> <tt class="py-name">length</tt> <tt class="py-op">==</tt> <tt class="py-string">""</tt><tt class="py-op">:</tt> </tt>
+<a name="L337"></a><tt class="py-lineno">337</tt> <tt class="py-line"> <tt class="py-keyword">raise</tt> <tt class="py-name">EOFError</tt> </tt>
+<a name="L338"></a><tt class="py-lineno">338</tt> <tt class="py-line"> <tt class="py-keyword">return</tt> <tt class="py-name">struct</tt><tt class="py-op">.</tt><tt class="py-name">unpack</tt><tt class="py-op">(</tt><tt class="py-string">"!i"</tt><tt class="py-op">,</tt> <tt class="py-name">length</tt><tt class="py-op">)</tt><tt class="py-op">[</tt><tt class="py-number">0</tt><tt class="py-op">]</tt> </tt>
+</div><a name="L339"></a><tt class="py-lineno">339</tt> <tt class="py-line"> </tt>
+<a name="L340"></a><tt class="py-lineno">340</tt> <tt class="py-line"> </tt>
+<a name="write_int"></a><div id="write_int-def"><a name="L341"></a><tt class="py-lineno">341</tt> <a class="py-toggle" href="#" id="write_int-toggle" onclick="return toggle('write_int');">-</a><tt class="py-line"><tt class="py-keyword">def</tt> <a class="py-def-name" href="pyspark.serializers-module.html#write_int">write_int</a><tt class="py-op">(</tt><tt class="py-param">value</tt><tt class="py-op">,</tt> <tt class="py-param">stream</tt><tt class="py-op">)</tt><tt class="py-op">:</tt> </tt>
+</div><div id="write_int-collapsed" style="display:none;" pad="+++" indent="++++"></div><div id="write_int-expanded"><a name="L342"></a><tt class="py-lineno">342</tt> <tt class="py-line"> <tt class="py-name">stream</tt><tt class="py-op">.</tt><tt class="py-name">write</tt><tt class="py-op">(</tt><tt class="py-name">struct</tt><tt class="py-op">.</tt><tt class="py-name">pack</tt><tt class="py-op">(</tt><tt class="py-string">"!i"</tt><tt class="py-op">,</tt> <tt id="link-28" class="py-name"><a title="pyspark.accumulators.Accumulator.value" class="py-name" href="#" onclick="return doclink('link-28', 'value', 'link-26');">value</a></tt><tt class="py-op">)</tt><tt class="py-op">)</tt> </tt>
+</div><a name="L343"></a><tt class="py-lineno">343</tt> <tt class="py-line"> </tt>
+<a name="L344"></a><tt class="py-lineno">344</tt> <tt class="py-line"> </tt>
+<a name="write_with_length"></a><div id="write_with_length-def"><a name="L345"></a><tt class="py-lineno">345</tt> <a class="py-toggle" href="#" id="write_with_length-toggle" onclick="return toggle('write_with_length');">-</a><tt class="py-line"><tt class="py-keyword">def</tt> <a class="py-def-name" href="pyspark.serializers-module.html#write_with_length">write_with_length</a><tt class="py-op">(</tt><tt class="py-param">obj</tt><tt class="py-op">,</tt> <tt class="py-param">stream</tt><tt class="py-op">)</tt><tt class="py-op">:</tt> </tt>
+</div><div id="write_with_length-collapsed" style="display:none;" pad="+++" indent="++++"></div><div id="write_with_length-expanded"><a name="L346"></a><tt class="py-lineno">346</tt> <tt class="py-line"> <tt class="py-name">write_int</tt><tt class="py-op">(</tt><tt class="py-name">len</tt><tt class="py-op">(</tt><tt class="py-name">obj</tt><tt class="py-op">)</tt><tt class="py-op">,</tt> <tt class="py-name">stream</tt><tt class="py-op">)</tt> </tt>
+<a name="L347"></a><tt class="py-lineno">347</tt> <tt class="py-line"> <tt class="py-name">stream</tt><tt class="py-op">.</tt><tt class="py-name">write</tt><tt class="py-op">(</tt><tt class="py-name">obj</tt><tt class="py-op">)</tt> </tt>
+</div><a name="L348"></a><tt class="py-lineno">348</tt> <tt class="py-line"> </tt><script type="text/javascript">
+<!--
+expandto(location.href);
+// -->
+</script>
+</pre>
+<br />
+<!-- ==================== NAVIGATION BAR ==================== -->
+<table class="navbar" border="0" width="100%" cellpadding="0"
+ bgcolor="#a0c0ff" cellspacing="0">
+ <tr valign="middle">
+ <!-- Home link -->
+ <th>&nbsp;&nbsp;&nbsp;<a
+ href="pyspark-module.html">Home</a>&nbsp;&nbsp;&nbsp;</th>
+
+ <!-- Tree link -->
+ <th>&nbsp;&nbsp;&nbsp;<a
+ href="module-tree.html">Trees</a>&nbsp;&nbsp;&nbsp;</th>
+
+ <!-- Index link -->
+ <th>&nbsp;&nbsp;&nbsp;<a
+ href="identifier-index.html">Indices</a>&nbsp;&nbsp;&nbsp;</th>
+
+ <!-- Help link -->
+ <th>&nbsp;&nbsp;&nbsp;<a
+ href="help.html">Help</a>&nbsp;&nbsp;&nbsp;</th>
+
+ <!-- Project homepage -->
+ <th class="navbar" align="right" width="100%">
+ <table border="0" cellpadding="0" cellspacing="0">
+ <tr><th class="navbar" align="center"
+ ><a class="navbar" target="_top" href="http://spark.apache.org">Spark 1.0.1 Python API Docs</a></th>
+ </tr></table></th>
+ </tr>
+</table>
+<table border="0" cellpadding="0" cellspacing="0" width="100%">
+ <tr>
+ <td align="left" class="footer">
+ Generated by Epydoc 3.0.1 on Fri Jul 4 18:52:26 2014
+ </td>
+ <td align="right" class="footer">
+ <a target="mainFrame" href="http://epydoc.sourceforge.net"
+ >http://epydoc.sourceforge.net</a>
+ </td>
+ </tr>
+</table>
+
+<script type="text/javascript">
+ <!--
+ // Private objects are initially displayed (because if
+ // javascript is turned off then we want them to be
+ // visible); but by default, we want to hide them. So hide
+ // them unless we have a cookie that says to show them.
+ checkCookie();
+ // -->
+</script>
+</body>
+</html>