about | summary | refs | log | tree | commit | diff
path: root/examples/src/main/python/pagerank.py
diff options
context:
space:
mode:
Diffstat (limited to 'examples/src/main/python/pagerank.py')
-rwxr-xr-x examples/src/main/python/pagerank.py 12
1 files changed, 6 insertions, 6 deletions
diff --git a/examples/src/main/python/pagerank.py b/examples/src/main/python/pagerank.py
index d350fa46fa..0b96343158 100755
--- a/examples/src/main/python/pagerank.py
+++ b/examples/src/main/python/pagerank.py
@@ -15,9 +15,8 @@
# limitations under the License.
#
-#!/usr/bin/env python
-
-import re, sys
+import re
+import sys
from operator import add
from pyspark import SparkContext
@@ -26,7 +25,8 @@ from pyspark import SparkContext
def computeContribs(urls, rank):
"""Calculates URL contributions to the rank of other URLs."""
num_urls = len(urls)
- for url in urls: yield (url, rank / num_urls)
+ for url in urls:
+ yield (url, rank / num_urls)
def parseNeighbors(urls):
@@ -59,8 +59,8 @@ if __name__ == "__main__":
# Calculates and updates URL ranks continuously using PageRank algorithm.
for iteration in xrange(int(sys.argv[2])):
# Calculates URL contributions to the rank of other URLs.
- contribs = links.join(ranks).flatMap(lambda (url, (urls, rank)):
- computeContribs(urls, rank))
+ contribs = links.join(ranks).flatMap(
+ lambda (url, (urls, rank)): computeContribs(urls, rank))
# Re-calculates URL ranks based on neighbor contributions.
ranks = contribs.reduceByKey(add).mapValues(lambda rank: rank * 0.85 + 0.15)