From 0a5cacb9615d960c93bca8cc3f4ad2a599f94ec0 Mon Sep 17 00:00:00 2001
From: Tor Myklebust
Date: Fri, 20 Dec 2013 02:05:15 -0500
Subject: Change some docstrings and add some others.

---
 python/pyspark/mllib.py | 4 +++-
 1 file changed, 3 insertions(+), 1 deletion(-)

(limited to 'python')

diff --git a/python/pyspark/mllib.py b/python/pyspark/mllib.py
index ce1363fd17..928caa9e80 100644
--- a/python/pyspark/mllib.py
+++ b/python/pyspark/mllib.py
@@ -146,7 +146,7 @@ def _linear_predictor_typecheck(x, coeffs):
         raise TypeError("Argument of type " + type(x) + " unsupported");
 
 class LinearModel(object):
-    """Something containing a vector of coefficients and an intercept."""
+    """Something that has a vector of coefficients and an intercept."""
     def __init__(self, coeff, intercept):
         self._coeff = coeff
         self._intercept = intercept
@@ -305,6 +305,7 @@ class KMeansModel(object):
         self.centers = centers_
 
     def predict(self, x):
+        """Find the cluster to which x belongs in this model."""
         best = 0
         best_distance = 1e75
         for i in range(0, self.centers.shape[0]):
@@ -318,6 +319,7 @@ class KMeansModel(object):
     @classmethod
     def train(cls, sc, data, k, maxIterations = 100, runs = 1,
             initialization_mode="k-means||"):
+        """Train a k-means clustering model."""
         dataBytes = _get_unmangled_double_vector_rdd(data)
         ans = sc._jvm.PythonMLLibAPI().trainKMeansModel(dataBytes._jrdd,
                 k, maxIterations, runs, initialization_mode)
-- 
cgit v1.2.3