<?xml version="1.0" encoding="ascii"?>
<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
"http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
<head>
<title>pyspark.mllib.recommendation</title>
<link rel="stylesheet" href="epydoc.css" type="text/css" />
<script type="text/javascript" src="epydoc.js"></script>
</head>
<body bgcolor="white" text="black" link="blue" vlink="#204080"
alink="#204080">
<!-- ==================== NAVIGATION BAR ==================== -->
<table class="navbar" border="0" width="100%" cellpadding="0"
bgcolor="#a0c0ff" cellspacing="0">
<tr valign="middle">
<!-- Home link -->
<th> <a
href="pyspark-module.html">Home</a> </th>
<!-- Tree link -->
<th> <a
href="module-tree.html">Trees</a> </th>
<!-- Index link -->
<th> <a
href="identifier-index.html">Indices</a> </th>
<!-- Help link -->
<th> <a
href="help.html">Help</a> </th>
<!-- Project homepage -->
<th class="navbar" align="right" width="100%">
<table border="0" cellpadding="0" cellspacing="0">
<tr><th class="navbar" align="center"
><a class="navbar" target="_top" href="http://spark.apache.org">Spark 1.0.0 Python API Docs</a></th>
</tr></table></th>
</tr>
</table>
<table width="100%" cellpadding="0" cellspacing="0">
<tr valign="top">
<td width="100%">
<span class="breadcrumbs">
<a href="pyspark-module.html">Package pyspark</a> ::
<a href="pyspark.mllib-module.html">Package mllib</a> ::
Module recommendation
</span>
</td>
<td>
<table cellpadding="0" cellspacing="0">
<!-- hide/show private -->
<tr><td align="right"><span class="options"
>[<a href="frames.html" target="_top">frames</a
>] | [<a href="pyspark.mllib.recommendation-pysrc.html"
target="_top">no frames</a>]</span></td></tr>
</table>
</td>
</tr>
</table>
<h1 class="epydoc">Source Code for <a href="pyspark.mllib.recommendation-module.html">Module pyspark.mllib.recommendation</a></h1>
<pre class="py-src">
<a name="L1"></a><tt class="py-lineno"> 1</tt> <tt class="py-line"><tt class="py-comment">#</tt> </tt>
<a name="L2"></a><tt class="py-lineno"> 2</tt> <tt class="py-line"><tt class="py-comment"># Licensed to the Apache Software Foundation (ASF) under one or more</tt> </tt>
<a name="L3"></a><tt class="py-lineno"> 3</tt> <tt class="py-line"><tt class="py-comment"># contributor license agreements. See the NOTICE file distributed with</tt> </tt>
<a name="L4"></a><tt class="py-lineno"> 4</tt> <tt class="py-line"><tt class="py-comment"># this work for additional information regarding copyright ownership.</tt> </tt>
<a name="L5"></a><tt class="py-lineno"> 5</tt> <tt class="py-line"><tt class="py-comment"># The ASF licenses this file to You under the Apache License, Version 2.0</tt> </tt>
<a name="L6"></a><tt class="py-lineno"> 6</tt> <tt class="py-line"><tt class="py-comment"># (the "License"); you may not use this file except in compliance with</tt> </tt>
<a name="L7"></a><tt class="py-lineno"> 7</tt> <tt class="py-line"><tt class="py-comment"># the License. You may obtain a copy of the License at</tt> </tt>
<a name="L8"></a><tt class="py-lineno"> 8</tt> <tt class="py-line"><tt class="py-comment">#</tt> </tt>
<a name="L9"></a><tt class="py-lineno"> 9</tt> <tt class="py-line"><tt class="py-comment"># http://www.apache.org/licenses/LICENSE-2.0</tt> </tt>
<a name="L10"></a><tt class="py-lineno">10</tt> <tt class="py-line"><tt class="py-comment">#</tt> </tt>
<a name="L11"></a><tt class="py-lineno">11</tt> <tt class="py-line"><tt class="py-comment"># Unless required by applicable law or agreed to in writing, software</tt> </tt>
<a name="L12"></a><tt class="py-lineno">12</tt> <tt class="py-line"><tt class="py-comment"># distributed under the License is distributed on an "AS IS" BASIS,</tt> </tt>
<a name="L13"></a><tt class="py-lineno">13</tt> <tt class="py-line"><tt class="py-comment"># WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.</tt> </tt>
<a name="L14"></a><tt class="py-lineno">14</tt> <tt class="py-line"><tt class="py-comment"># See the License for the specific language governing permissions and</tt> </tt>
<a name="L15"></a><tt class="py-lineno">15</tt> <tt class="py-line"><tt class="py-comment"># limitations under the License.</tt> </tt>
<a name="L16"></a><tt class="py-lineno">16</tt> <tt class="py-line"><tt class="py-comment">#</tt> </tt>
<a name="L17"></a><tt class="py-lineno">17</tt> <tt class="py-line"> </tt>
<a name="L18"></a><tt class="py-lineno">18</tt> <tt class="py-line"><tt class="py-keyword">from</tt> <tt id="link-0" class="py-name" targets="Package pyspark=pyspark-module.html"><a title="pyspark" class="py-name" href="#" onclick="return doclink('link-0', 'pyspark', 'link-0');">pyspark</a></tt> <tt class="py-keyword">import</tt> <tt id="link-1" class="py-name" targets="Class pyspark.context.SparkContext=pyspark.context.SparkContext-class.html"><a title="pyspark.context.SparkContext" class="py-name" href="#" onclick="return doclink('link-1', 'SparkContext', 'link-1');">SparkContext</a></tt> </tt>
<a name="L19"></a><tt class="py-lineno">19</tt> <tt class="py-line"><tt class="py-keyword">from</tt> <tt id="link-2" class="py-name"><a title="pyspark" class="py-name" href="#" onclick="return doclink('link-2', 'pyspark', 'link-0');">pyspark</a></tt><tt class="py-op">.</tt><tt id="link-3" class="py-name" targets="Package pyspark.mllib=pyspark.mllib-module.html"><a title="pyspark.mllib" class="py-name" href="#" onclick="return doclink('link-3', 'mllib', 'link-3');">mllib</a></tt><tt class="py-op">.</tt><tt class="py-name">_common</tt> <tt class="py-keyword">import</tt> \ </tt>
<a name="L20"></a><tt class="py-lineno">20</tt> <tt class="py-line"> <tt class="py-name">_get_unmangled_rdd</tt><tt class="py-op">,</tt> <tt class="py-name">_get_unmangled_double_vector_rdd</tt><tt class="py-op">,</tt> \ </tt>
<a name="L21"></a><tt class="py-lineno">21</tt> <tt class="py-line"> <tt class="py-name">_serialize_double_matrix</tt><tt class="py-op">,</tt> <tt class="py-name">_deserialize_double_matrix</tt><tt class="py-op">,</tt> \ </tt>
<a name="L22"></a><tt class="py-lineno">22</tt> <tt class="py-line"> <tt class="py-name">_serialize_double_vector</tt><tt class="py-op">,</tt> <tt class="py-name">_deserialize_double_vector</tt><tt class="py-op">,</tt> \ </tt>
<a name="L23"></a><tt class="py-lineno">23</tt> <tt class="py-line"> <tt class="py-name">_get_initial_weights</tt><tt class="py-op">,</tt> <tt class="py-name">_serialize_rating</tt><tt class="py-op">,</tt> <tt class="py-name">_regression_train_wrapper</tt><tt class="py-op">,</tt> \ </tt>
<a name="L24"></a><tt class="py-lineno">24</tt> <tt class="py-line"> <tt class="py-name">_serialize_tuple</tt><tt class="py-op">,</tt> <tt class="py-name">RatingDeserializer</tt> </tt>
<a name="L25"></a><tt class="py-lineno">25</tt> <tt class="py-line"><tt class="py-keyword">from</tt> <tt id="link-4" class="py-name"><a title="pyspark" class="py-name" href="#" onclick="return doclink('link-4', 'pyspark', 'link-0');">pyspark</a></tt><tt class="py-op">.</tt><tt id="link-5" class="py-name" targets="Module pyspark.rdd=pyspark.rdd-module.html"><a title="pyspark.rdd" class="py-name" href="#" onclick="return doclink('link-5', 'rdd', 'link-5');">rdd</a></tt> <tt class="py-keyword">import</tt> <tt id="link-6" class="py-name" targets="Class pyspark.rdd.RDD=pyspark.rdd.RDD-class.html"><a title="pyspark.rdd.RDD" class="py-name" href="#" onclick="return doclink('link-6', 'RDD', 'link-6');">RDD</a></tt> </tt>
<a name="MatrixFactorizationModel"></a><div id="MatrixFactorizationModel-def"><a name="L26"></a><tt class="py-lineno">26</tt> <tt class="py-line"> </tt>
<a name="L27"></a><tt class="py-lineno">27</tt> <tt class="py-line"> </tt>
<a name="L28"></a><tt class="py-lineno">28</tt> <a class="py-toggle" href="#" id="MatrixFactorizationModel-toggle" onclick="return toggle('MatrixFactorizationModel');">-</a><tt class="py-line"><tt class="py-keyword">class</tt> <a class="py-def-name" href="pyspark.mllib.recommendation.MatrixFactorizationModel-class.html">MatrixFactorizationModel</a><tt class="py-op">(</tt><tt class="py-base-class">object</tt><tt class="py-op">)</tt><tt class="py-op">:</tt> </tt>
</div><div id="MatrixFactorizationModel-collapsed" style="display:none;" pad="++" indent="++++"></div><div id="MatrixFactorizationModel-expanded"><a name="L29"></a><tt class="py-lineno">29</tt> <tt class="py-line"> <tt class="py-docstring">"""A matrix factorisation model trained by regularized alternating</tt> </tt>
<a name="L30"></a><tt class="py-lineno">30</tt> <tt class="py-line"><tt class="py-docstring"> least-squares.</tt> </tt>
<a name="L31"></a><tt class="py-lineno">31</tt> <tt class="py-line"><tt class="py-docstring"></tt> </tt>
<a name="L32"></a><tt class="py-lineno">32</tt> <tt class="py-line"><tt class="py-docstring"> >>> r1 = (1, 1, 1.0)</tt> </tt>
<a name="L33"></a><tt class="py-lineno">33</tt> <tt class="py-line"><tt class="py-docstring"> >>> r2 = (1, 2, 2.0)</tt> </tt>
<a name="L34"></a><tt class="py-lineno">34</tt> <tt class="py-line"><tt class="py-docstring"> >>> r3 = (2, 1, 2.0)</tt> </tt>
<a name="L35"></a><tt class="py-lineno">35</tt> <tt class="py-line"><tt class="py-docstring"> >>> ratings = sc.parallelize([r1, r2, r3])</tt> </tt>
<a name="L36"></a><tt class="py-lineno">36</tt> <tt class="py-line"><tt class="py-docstring"> >>> model = ALS.trainImplicit(ratings, 1)</tt> </tt>
<a name="L37"></a><tt class="py-lineno">37</tt> <tt class="py-line"><tt class="py-docstring"> >>> model.predict(2,2) is not None</tt> </tt>
<a name="L38"></a><tt class="py-lineno">38</tt> <tt class="py-line"><tt class="py-docstring"> True</tt> </tt>
<a name="L39"></a><tt class="py-lineno">39</tt> <tt class="py-line"><tt class="py-docstring"> >>> testset = sc.parallelize([(1, 2), (1, 1)])</tt> </tt>
<a name="L40"></a><tt class="py-lineno">40</tt> <tt class="py-line"><tt class="py-docstring"> >>> model.predictAll(testset).count() == 2</tt> </tt>
<a name="L41"></a><tt class="py-lineno">41</tt> <tt class="py-line"><tt class="py-docstring"> True</tt> </tt>
<a name="L42"></a><tt class="py-lineno">42</tt> <tt class="py-line"><tt class="py-docstring"> """</tt> </tt>
<a name="L43"></a><tt class="py-lineno">43</tt> <tt class="py-line"> </tt>
<a name="MatrixFactorizationModel.__init__"></a><div id="MatrixFactorizationModel.__init__-def"><a name="L44"></a><tt class="py-lineno">44</tt> <a class="py-toggle" href="#" id="MatrixFactorizationModel.__init__-toggle" onclick="return toggle('MatrixFactorizationModel.__init__');">-</a><tt class="py-line"> <tt class="py-keyword">def</tt> <a class="py-def-name" href="pyspark.mllib.recommendation.MatrixFactorizationModel-class.html#__init__">__init__</a><tt class="py-op">(</tt><tt class="py-param">self</tt><tt class="py-op">,</tt> <tt class="py-param">sc</tt><tt class="py-op">,</tt> <tt class="py-param">java_model</tt><tt class="py-op">)</tt><tt class="py-op">:</tt> </tt>
</div><div id="MatrixFactorizationModel.__init__-collapsed" style="display:none;" pad="++" indent="++++++++"></div><div id="MatrixFactorizationModel.__init__-expanded"><a name="L45"></a><tt class="py-lineno">45</tt> <tt class="py-line"> <tt class="py-name">self</tt><tt class="py-op">.</tt><tt class="py-name">_context</tt> <tt class="py-op">=</tt> <tt class="py-name">sc</tt> </tt>
<a name="L46"></a><tt class="py-lineno">46</tt> <tt class="py-line"> <tt class="py-name">self</tt><tt class="py-op">.</tt><tt class="py-name">_java_model</tt> <tt class="py-op">=</tt> <tt class="py-name">java_model</tt> </tt>
</div><a name="L47"></a><tt class="py-lineno">47</tt> <tt class="py-line"> </tt>
<a name="MatrixFactorizationModel.__del__"></a><div id="MatrixFactorizationModel.__del__-def"><a name="L48"></a><tt class="py-lineno">48</tt> <a class="py-toggle" href="#" id="MatrixFactorizationModel.__del__-toggle" onclick="return toggle('MatrixFactorizationModel.__del__');">-</a><tt class="py-line"> <tt class="py-keyword">def</tt> <a class="py-def-name" href="pyspark.mllib.recommendation.MatrixFactorizationModel-class.html#__del__">__del__</a><tt class="py-op">(</tt><tt class="py-param">self</tt><tt class="py-op">)</tt><tt class="py-op">:</tt> </tt>
</div><div id="MatrixFactorizationModel.__del__-collapsed" style="display:none;" pad="++" indent="++++++++"></div><div id="MatrixFactorizationModel.__del__-expanded"><a name="L49"></a><tt class="py-lineno">49</tt> <tt class="py-line"> <tt class="py-name">self</tt><tt class="py-op">.</tt><tt class="py-name">_context</tt><tt class="py-op">.</tt><tt id="link-7" class="py-name" targets="Variable pyspark.context.SparkContext._gateway=pyspark.context.SparkContext-class.html#_gateway"><a title="pyspark.context.SparkContext._gateway" class="py-name" href="#" onclick="return doclink('link-7', '_gateway', 'link-7');">_gateway</a></tt><tt class="py-op">.</tt><tt class="py-name">detach</tt><tt class="py-op">(</tt><tt class="py-name">self</tt><tt class="py-op">.</tt><tt class="py-name">_java_model</tt><tt class="py-op">)</tt> </tt>
</div><a name="L50"></a><tt class="py-lineno">50</tt> <tt class="py-line"> </tt>
<a name="MatrixFactorizationModel.predict"></a><div id="MatrixFactorizationModel.predict-def"><a name="L51"></a><tt class="py-lineno">51</tt> <a class="py-toggle" href="#" id="MatrixFactorizationModel.predict-toggle" onclick="return toggle('MatrixFactorizationModel.predict');">-</a><tt class="py-line"> <tt class="py-keyword">def</tt> <a class="py-def-name" href="pyspark.mllib.recommendation.MatrixFactorizationModel-class.html#predict">predict</a><tt class="py-op">(</tt><tt class="py-param">self</tt><tt class="py-op">,</tt> <tt class="py-param">user</tt><tt class="py-op">,</tt> <tt class="py-param">product</tt><tt class="py-op">)</tt><tt class="py-op">:</tt> </tt>
</div><div id="MatrixFactorizationModel.predict-collapsed" style="display:none;" pad="++" indent="++++++++"></div><div id="MatrixFactorizationModel.predict-expanded"><a name="L52"></a><tt class="py-lineno">52</tt> <tt class="py-line"> <tt class="py-keyword">return</tt> <tt class="py-name">self</tt><tt class="py-op">.</tt><tt class="py-name">_java_model</tt><tt class="py-op">.</tt><tt id="link-8" class="py-name" targets="Method pyspark.mllib.classification.LogisticRegressionModel.predict()=pyspark.mllib.classification.LogisticRegressionModel-class.html#predict,Method pyspark.mllib.classification.NaiveBayesModel.predict()=pyspark.mllib.classification.NaiveBayesModel-class.html#predict,Method pyspark.mllib.classification.SVMModel.predict()=pyspark.mllib.classification.SVMModel-class.html#predict,Method pyspark.mllib.clustering.KMeansModel.predict()=pyspark.mllib.clustering.KMeansModel-class.html#predict,Method pyspark.mllib.recommendation.MatrixFactorizationModel.predict()=pyspark.mllib.recommendation.MatrixFactorizationModel-class.html#predict,Method pyspark.mllib.regression.LinearRegressionModelBase.predict()=pyspark.mllib.regression.LinearRegressionModelBase-class.html#predict"><a title="pyspark.mllib.classification.LogisticRegressionModel.predict
pyspark.mllib.classification.NaiveBayesModel.predict
pyspark.mllib.classification.SVMModel.predict
pyspark.mllib.clustering.KMeansModel.predict
pyspark.mllib.recommendation.MatrixFactorizationModel.predict
pyspark.mllib.regression.LinearRegressionModelBase.predict" class="py-name" href="#" onclick="return doclink('link-8', 'predict', 'link-8');">predict</a></tt><tt class="py-op">(</tt><tt class="py-name">user</tt><tt class="py-op">,</tt> <tt class="py-name">product</tt><tt class="py-op">)</tt> </tt>
</div><a name="L53"></a><tt class="py-lineno">53</tt> <tt class="py-line"> </tt>
<a name="MatrixFactorizationModel.predictAll"></a><div id="MatrixFactorizationModel.predictAll-def"><a name="L54"></a><tt class="py-lineno">54</tt> <a class="py-toggle" href="#" id="MatrixFactorizationModel.predictAll-toggle" onclick="return toggle('MatrixFactorizationModel.predictAll');">-</a><tt class="py-line"> <tt class="py-keyword">def</tt> <a class="py-def-name" href="pyspark.mllib.recommendation.MatrixFactorizationModel-class.html#predictAll">predictAll</a><tt class="py-op">(</tt><tt class="py-param">self</tt><tt class="py-op">,</tt> <tt class="py-param">usersProducts</tt><tt class="py-op">)</tt><tt class="py-op">:</tt> </tt>
</div><div id="MatrixFactorizationModel.predictAll-collapsed" style="display:none;" pad="++" indent="++++++++"></div><div id="MatrixFactorizationModel.predictAll-expanded"><a name="L55"></a><tt class="py-lineno">55</tt> <tt class="py-line"> <tt class="py-name">usersProductsJRDD</tt> <tt class="py-op">=</tt> <tt class="py-name">_get_unmangled_rdd</tt><tt class="py-op">(</tt><tt class="py-name">usersProducts</tt><tt class="py-op">,</tt> <tt class="py-name">_serialize_tuple</tt><tt class="py-op">)</tt> </tt>
<a name="L56"></a><tt class="py-lineno">56</tt> <tt class="py-line"> <tt class="py-keyword">return</tt> <tt id="link-9" class="py-name"><a title="pyspark.rdd.RDD" class="py-name" href="#" onclick="return doclink('link-9', 'RDD', 'link-6');">RDD</a></tt><tt class="py-op">(</tt><tt class="py-name">self</tt><tt class="py-op">.</tt><tt class="py-name">_java_model</tt><tt class="py-op">.</tt><tt id="link-10" class="py-name"><a title="pyspark.mllib.classification.LogisticRegressionModel.predict
pyspark.mllib.classification.NaiveBayesModel.predict
pyspark.mllib.classification.SVMModel.predict
pyspark.mllib.clustering.KMeansModel.predict
pyspark.mllib.recommendation.MatrixFactorizationModel.predict
pyspark.mllib.regression.LinearRegressionModelBase.predict" class="py-name" href="#" onclick="return doclink('link-10', 'predict', 'link-8');">predict</a></tt><tt class="py-op">(</tt><tt class="py-name">usersProductsJRDD</tt><tt class="py-op">.</tt><tt class="py-name">_jrdd</tt><tt class="py-op">)</tt><tt class="py-op">,</tt> </tt>
<a name="L57"></a><tt class="py-lineno">57</tt> <tt class="py-line"> <tt class="py-name">self</tt><tt class="py-op">.</tt><tt class="py-name">_context</tt><tt class="py-op">,</tt> <tt class="py-name">RatingDeserializer</tt><tt class="py-op">(</tt><tt class="py-op">)</tt><tt class="py-op">)</tt> </tt>
</div></div><a name="L58"></a><tt class="py-lineno">58</tt> <tt class="py-line"> </tt>
<a name="ALS"></a><div id="ALS-def"><a name="L59"></a><tt class="py-lineno">59</tt> <tt class="py-line"> </tt>
<a name="L60"></a><tt class="py-lineno">60</tt> <a class="py-toggle" href="#" id="ALS-toggle" onclick="return toggle('ALS');">-</a><tt class="py-line"><tt class="py-keyword">class</tt> <a class="py-def-name" href="pyspark.mllib.recommendation.ALS-class.html">ALS</a><tt class="py-op">(</tt><tt class="py-base-class">object</tt><tt class="py-op">)</tt><tt class="py-op">:</tt> </tt>
</div><div id="ALS-collapsed" style="display:none;" pad="++" indent="++++"></div><div id="ALS-expanded"><a name="L61"></a><tt class="py-lineno">61</tt> <tt class="py-line"> <tt class="py-decorator">@</tt><tt class="py-decorator">classmethod</tt> </tt>
<a name="ALS.train"></a><div id="ALS.train-def"><a name="L62"></a><tt class="py-lineno">62</tt> <a class="py-toggle" href="#" id="ALS.train-toggle" onclick="return toggle('ALS.train');">-</a><tt class="py-line"> <tt class="py-keyword">def</tt> <a class="py-def-name" href="pyspark.mllib.recommendation.ALS-class.html#train">train</a><tt class="py-op">(</tt><tt class="py-param">cls</tt><tt class="py-op">,</tt> <tt class="py-param">ratings</tt><tt class="py-op">,</tt> <tt class="py-param">rank</tt><tt class="py-op">,</tt> <tt class="py-param">iterations</tt><tt class="py-op">=</tt><tt class="py-number">5</tt><tt class="py-op">,</tt> <tt class="py-param">lambda_</tt><tt class="py-op">=</tt><tt class="py-number">0.01</tt><tt class="py-op">,</tt> <tt class="py-param">blocks</tt><tt class="py-op">=</tt><tt class="py-op">-</tt><tt class="py-number">1</tt><tt class="py-op">)</tt><tt class="py-op">:</tt> </tt>
</div><div id="ALS.train-collapsed" style="display:none;" pad="++" indent="++++++++"></div><div id="ALS.train-expanded"><a name="L63"></a><tt class="py-lineno">63</tt> <tt class="py-line"> <tt class="py-name">sc</tt> <tt class="py-op">=</tt> <tt class="py-name">ratings</tt><tt class="py-op">.</tt><tt id="link-11" class="py-name" targets="Module pyspark.context=pyspark.context-module.html,Method pyspark.rdd.RDD.context()=pyspark.rdd.RDD-class.html#context"><a title="pyspark.context
pyspark.rdd.RDD.context" class="py-name" href="#" onclick="return doclink('link-11', 'context', 'link-11');">context</a></tt> </tt>
<a name="L64"></a><tt class="py-lineno">64</tt> <tt class="py-line"> <tt class="py-name">ratingBytes</tt> <tt class="py-op">=</tt> <tt class="py-name">_get_unmangled_rdd</tt><tt class="py-op">(</tt><tt class="py-name">ratings</tt><tt class="py-op">,</tt> <tt class="py-name">_serialize_rating</tt><tt class="py-op">)</tt> </tt>
<a name="L65"></a><tt class="py-lineno">65</tt> <tt class="py-line"> <tt class="py-name">mod</tt> <tt class="py-op">=</tt> <tt class="py-name">sc</tt><tt class="py-op">.</tt><tt id="link-12" class="py-name" targets="Variable pyspark.context.SparkContext._jvm=pyspark.context.SparkContext-class.html#_jvm"><a title="pyspark.context.SparkContext._jvm" class="py-name" href="#" onclick="return doclink('link-12', '_jvm', 'link-12');">_jvm</a></tt><tt class="py-op">.</tt><tt class="py-name">PythonMLLibAPI</tt><tt class="py-op">(</tt><tt class="py-op">)</tt><tt class="py-op">.</tt><tt class="py-name">trainALSModel</tt><tt class="py-op">(</tt> </tt>
<a name="L66"></a><tt class="py-lineno">66</tt> <tt class="py-line"> <tt class="py-name">ratingBytes</tt><tt class="py-op">.</tt><tt class="py-name">_jrdd</tt><tt class="py-op">,</tt> <tt class="py-name">rank</tt><tt class="py-op">,</tt> <tt class="py-name">iterations</tt><tt class="py-op">,</tt> <tt class="py-name">lambda_</tt><tt class="py-op">,</tt> <tt class="py-name">blocks</tt><tt class="py-op">)</tt> </tt>
<a name="L67"></a><tt class="py-lineno">67</tt> <tt class="py-line"> <tt class="py-keyword">return</tt> <tt id="link-13" class="py-name" targets="Class pyspark.mllib.recommendation.MatrixFactorizationModel=pyspark.mllib.recommendation.MatrixFactorizationModel-class.html"><a title="pyspark.mllib.recommendation.MatrixFactorizationModel" class="py-name" href="#" onclick="return doclink('link-13', 'MatrixFactorizationModel', 'link-13');">MatrixFactorizationModel</a></tt><tt class="py-op">(</tt><tt class="py-name">sc</tt><tt class="py-op">,</tt> <tt class="py-name">mod</tt><tt class="py-op">)</tt> </tt>
</div><a name="L68"></a><tt class="py-lineno">68</tt> <tt class="py-line"> </tt>
<a name="L69"></a><tt class="py-lineno">69</tt> <tt class="py-line"> <tt class="py-decorator">@</tt><tt class="py-decorator">classmethod</tt> </tt>
<a name="ALS.trainImplicit"></a><div id="ALS.trainImplicit-def"><a name="L70"></a><tt class="py-lineno">70</tt> <a class="py-toggle" href="#" id="ALS.trainImplicit-toggle" onclick="return toggle('ALS.trainImplicit');">-</a><tt class="py-line"> <tt class="py-keyword">def</tt> <a class="py-def-name" href="pyspark.mllib.recommendation.ALS-class.html#trainImplicit">trainImplicit</a><tt class="py-op">(</tt><tt class="py-param">cls</tt><tt class="py-op">,</tt> <tt class="py-param">ratings</tt><tt class="py-op">,</tt> <tt class="py-param">rank</tt><tt class="py-op">,</tt> <tt class="py-param">iterations</tt><tt class="py-op">=</tt><tt class="py-number">5</tt><tt class="py-op">,</tt> <tt class="py-param">lambda_</tt><tt class="py-op">=</tt><tt class="py-number">0.01</tt><tt class="py-op">,</tt> <tt class="py-param">blocks</tt><tt class="py-op">=</tt><tt class="py-op">-</tt><tt class="py-number">1</tt><tt class="py-op">,</tt> <tt class="py-param">alpha</tt><tt class="py-op">=</tt><tt class="py-number">0.01</tt><tt class="py-op">)</tt><tt class="py-op">:</tt> </tt>
</div><div id="ALS.trainImplicit-collapsed" style="display:none;" pad="++" indent="++++++++"></div><div id="ALS.trainImplicit-expanded"><a name="L71"></a><tt class="py-lineno">71</tt> <tt class="py-line"> <tt class="py-name">sc</tt> <tt class="py-op">=</tt> <tt class="py-name">ratings</tt><tt class="py-op">.</tt><tt id="link-14" class="py-name"><a title="pyspark.context
pyspark.rdd.RDD.context" class="py-name" href="#" onclick="return doclink('link-14', 'context', 'link-11');">context</a></tt> </tt>
<a name="L72"></a><tt class="py-lineno">72</tt> <tt class="py-line"> <tt class="py-name">ratingBytes</tt> <tt class="py-op">=</tt> <tt class="py-name">_get_unmangled_rdd</tt><tt class="py-op">(</tt><tt class="py-name">ratings</tt><tt class="py-op">,</tt> <tt class="py-name">_serialize_rating</tt><tt class="py-op">)</tt> </tt>
<a name="L73"></a><tt class="py-lineno">73</tt> <tt class="py-line"> <tt class="py-name">mod</tt> <tt class="py-op">=</tt> <tt class="py-name">sc</tt><tt class="py-op">.</tt><tt id="link-15" class="py-name"><a title="pyspark.context.SparkContext._jvm" class="py-name" href="#" onclick="return doclink('link-15', '_jvm', 'link-12');">_jvm</a></tt><tt class="py-op">.</tt><tt class="py-name">PythonMLLibAPI</tt><tt class="py-op">(</tt><tt class="py-op">)</tt><tt class="py-op">.</tt><tt class="py-name">trainImplicitALSModel</tt><tt class="py-op">(</tt> </tt>
<a name="L74"></a><tt class="py-lineno">74</tt> <tt class="py-line"> <tt class="py-name">ratingBytes</tt><tt class="py-op">.</tt><tt class="py-name">_jrdd</tt><tt class="py-op">,</tt> <tt class="py-name">rank</tt><tt class="py-op">,</tt> <tt class="py-name">iterations</tt><tt class="py-op">,</tt> <tt class="py-name">lambda_</tt><tt class="py-op">,</tt> <tt class="py-name">blocks</tt><tt class="py-op">,</tt> <tt class="py-name">alpha</tt><tt class="py-op">)</tt> </tt>
<a name="L75"></a><tt class="py-lineno">75</tt> <tt class="py-line"> <tt class="py-keyword">return</tt> <tt id="link-16" class="py-name"><a title="pyspark.mllib.recommendation.MatrixFactorizationModel" class="py-name" href="#" onclick="return doclink('link-16', 'MatrixFactorizationModel', 'link-13');">MatrixFactorizationModel</a></tt><tt class="py-op">(</tt><tt class="py-name">sc</tt><tt class="py-op">,</tt> <tt class="py-name">mod</tt><tt class="py-op">)</tt> </tt>
</div></div><a name="L76"></a><tt class="py-lineno">76</tt> <tt class="py-line"> </tt>
<a name="_test"></a><div id="_test-def"><a name="L77"></a><tt class="py-lineno">77</tt> <tt class="py-line"> </tt>
<a name="L78"></a><tt class="py-lineno">78</tt> <a class="py-toggle" href="#" id="_test-toggle" onclick="return toggle('_test');">-</a><tt class="py-line"><tt class="py-keyword">def</tt> <a class="py-def-name" href="pyspark.mllib.recommendation-module.html#_test">_test</a><tt class="py-op">(</tt><tt class="py-op">)</tt><tt class="py-op">:</tt> </tt>
</div><div id="_test-collapsed" style="display:none;" pad="++" indent="++++"></div><div id="_test-expanded"><a name="L79"></a><tt class="py-lineno">79</tt> <tt class="py-line"> <tt class="py-keyword">import</tt> <tt class="py-name">doctest</tt> </tt>
<a name="L80"></a><tt class="py-lineno">80</tt> <tt class="py-line"> <tt class="py-name">globs</tt> <tt class="py-op">=</tt> <tt class="py-name">globals</tt><tt class="py-op">(</tt><tt class="py-op">)</tt><tt class="py-op">.</tt><tt id="link-17" class="py-name" targets="Method pyspark.statcounter.StatCounter.copy()=pyspark.statcounter.StatCounter-class.html#copy"><a title="pyspark.statcounter.StatCounter.copy" class="py-name" href="#" onclick="return doclink('link-17', 'copy', 'link-17');">copy</a></tt><tt class="py-op">(</tt><tt class="py-op">)</tt> </tt>
<a name="L81"></a><tt class="py-lineno">81</tt> <tt class="py-line"> <tt class="py-name">globs</tt><tt class="py-op">[</tt><tt class="py-string">'sc'</tt><tt class="py-op">]</tt> <tt class="py-op">=</tt> <tt id="link-18" class="py-name"><a title="pyspark.context.SparkContext" class="py-name" href="#" onclick="return doclink('link-18', 'SparkContext', 'link-1');">SparkContext</a></tt><tt class="py-op">(</tt><tt class="py-string">'local[4]'</tt><tt class="py-op">,</tt> <tt class="py-string">'PythonTest'</tt><tt class="py-op">,</tt> <tt class="py-name">batchSize</tt><tt class="py-op">=</tt><tt class="py-number">2</tt><tt class="py-op">)</tt> </tt>
<a name="L82"></a><tt class="py-lineno">82</tt> <tt class="py-line"> <tt class="py-op">(</tt><tt class="py-name">failure_count</tt><tt class="py-op">,</tt> <tt class="py-name">test_count</tt><tt class="py-op">)</tt> <tt class="py-op">=</tt> <tt class="py-name">doctest</tt><tt class="py-op">.</tt><tt class="py-name">testmod</tt><tt class="py-op">(</tt><tt class="py-name">globs</tt><tt class="py-op">=</tt><tt class="py-name">globs</tt><tt class="py-op">,</tt> <tt class="py-name">optionflags</tt><tt class="py-op">=</tt><tt class="py-name">doctest</tt><tt class="py-op">.</tt><tt class="py-name">ELLIPSIS</tt><tt class="py-op">)</tt> </tt>
<a name="L83"></a><tt class="py-lineno">83</tt> <tt class="py-line"> <tt class="py-name">globs</tt><tt class="py-op">[</tt><tt class="py-string">'sc'</tt><tt class="py-op">]</tt><tt class="py-op">.</tt><tt id="link-19" class="py-name" targets="Method pyspark.context.SparkContext.stop()=pyspark.context.SparkContext-class.html#stop"><a title="pyspark.context.SparkContext.stop" class="py-name" href="#" onclick="return doclink('link-19', 'stop', 'link-19');">stop</a></tt><tt class="py-op">(</tt><tt class="py-op">)</tt> </tt>
<a name="L84"></a><tt class="py-lineno">84</tt> <tt class="py-line"> <tt class="py-keyword">if</tt> <tt class="py-name">failure_count</tt><tt class="py-op">:</tt> </tt>
<a name="L85"></a><tt class="py-lineno">85</tt> <tt class="py-line"> <tt class="py-name">exit</tt><tt class="py-op">(</tt><tt class="py-op">-</tt><tt class="py-number">1</tt><tt class="py-op">)</tt> </tt>
</div><a name="L86"></a><tt class="py-lineno">86</tt> <tt class="py-line"> </tt>
<a name="L87"></a><tt class="py-lineno">87</tt> <tt class="py-line"> </tt>
<a name="L88"></a><tt class="py-lineno">88</tt> <tt class="py-line"><tt class="py-keyword">if</tt> <tt class="py-name">__name__</tt> <tt class="py-op">==</tt> <tt class="py-string">"__main__"</tt><tt class="py-op">:</tt> </tt>
<a name="L89"></a><tt class="py-lineno">89</tt> <tt class="py-line"> <tt class="py-name">_test</tt><tt class="py-op">(</tt><tt class="py-op">)</tt> </tt>
<a name="L90"></a><tt class="py-lineno">90</tt> <tt class="py-line"> </tt><script type="text/javascript">
<!--
expandto(location.href);
// -->
</script>
</pre>
<br />
<!-- ==================== NAVIGATION BAR ==================== -->
<table class="navbar" border="0" width="100%" cellpadding="0"
bgcolor="#a0c0ff" cellspacing="0">
<tr valign="middle">
<!-- Home link -->
<th> <a
href="pyspark-module.html">Home</a> </th>
<!-- Tree link -->
<th> <a
href="module-tree.html">Trees</a> </th>
<!-- Index link -->
<th> <a
href="identifier-index.html">Indices</a> </th>
<!-- Help link -->
<th> <a
href="help.html">Help</a> </th>
<!-- Project homepage -->
<th class="navbar" align="right" width="100%">
<table border="0" cellpadding="0" cellspacing="0">
<tr><th class="navbar" align="center"
><a class="navbar" target="_top" href="http://spark.apache.org">Spark 1.0.0 Python API Docs</a></th>
</tr></table></th>
</tr>
</table>
<table border="0" cellpadding="0" cellspacing="0" width="100%">
<tr>
<td align="left" class="footer">
Generated by Epydoc 3.0.1 on Fri May 30 01:48:46 2014
</td>
<td align="right" class="footer">
<a target="mainFrame" href="http://epydoc.sourceforge.net"
>http://epydoc.sourceforge.net</a>
</td>
</tr>
</table>
<script type="text/javascript">
<!--
// Private objects are initially displayed (because if
// javascript is turned off then we want them to be
// visible); but by default, we want to hide them. So hide
// them unless we have a cookie that says to show them.
checkCookie();
// -->
</script>
</body>
</html>