From 43ef1e52bfe359f0f051a607a8dc77cc3b269508 Mon Sep 17 00:00:00 2001
From: Xiangrui Meng
Date: Mon, 21 Mar 2016 17:42:30 -0700
Subject: Revert "[SPARK-13019][DOCS] Replace example code in mllib-statistics.md using include_example"

This reverts commit 1af8de200c4d3357bcb09e7bbc6deece00e885f2.
---
 .../python/mllib/stratified_sampling_example.py | 38 ----------------------
 1 file changed, 38 deletions(-)
 delete mode 100644 examples/src/main/python/mllib/stratified_sampling_example.py

(limited to 'examples/src/main/python/mllib/stratified_sampling_example.py')

diff --git a/examples/src/main/python/mllib/stratified_sampling_example.py b/examples/src/main/python/mllib/stratified_sampling_example.py
deleted file mode 100644
index a13f8f08dd..0000000000
--- a/examples/src/main/python/mllib/stratified_sampling_example.py
+++ /dev/null
@@ -1,38 +0,0 @@
-#
-# Licensed to the Apache Software Foundation (ASF) under one or more
-# contributor license agreements. See the NOTICE file distributed with
-# this work for additional information regarding copyright ownership.
-# The ASF licenses this file to You under the Apache License, Version 2.0
-# (the "License"); you may not use this file except in compliance with
-# the License. You may obtain a copy of the License at
-#
-# http://www.apache.org/licenses/LICENSE-2.0
-#
-# Unless required by applicable law or agreed to in writing, software
-# distributed under the License is distributed on an "AS IS" BASIS,
-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-# See the License for the specific language governing permissions and
-# limitations under the License.
-#
-
-from __future__ import print_function
-
-from pyspark import SparkContext
-
-if __name__ == "__main__":
-    sc = SparkContext(appName="StratifiedSamplingExample") # SparkContext
-
-    # $example on$
-    # an RDD of any key value pairs
-    data = sc.parallelize([(1, 'a'), (1, 'b'), (2, 'c'), (2, 'd'), (2, 'e'), (3, 'f')])
-
-    # specify the exact fraction desired from each key as a dictionary
-    fractions = {1: 0.1, 2: 0.6, 3: 0.3}
-
-    approxSample = data.sampleByKey(False, fractions)
-    # $example off$
-
-    for each in approxSample.collect():
-        print(each)
-
-    sc.stop()
--
cgit v1.2.3