about | summary | refs | log | tree | commit | diff
path: root/pyspark
diff options
context:
space:
mode:
author: Josh Rosen <joshrosen@eecs.berkeley.edu> 2013-01-01 21:25:49 -0800
committer: Josh Rosen <joshrosen@eecs.berkeley.edu> 2013-01-01 21:25:49 -0800
commit: ce9f1bbe20eff794cd1d588dc88f109d32588cfe (patch)
tree: ff840eea62e8314dc4cefcaa08534c4b21e544ba /pyspark
parent: b58340dbd9a741331fc4c3829b08c093560056c2 (diff)
download: spark-ce9f1bbe20eff794cd1d588dc88f109d32588cfe.tar.gz
download: spark-ce9f1bbe20eff794cd1d588dc88f109d32588cfe.tar.bz2
download: spark-ce9f1bbe20eff794cd1d588dc88f109d32588cfe.zip
Add `pyspark` script to replace the other scripts.
Expand the PySpark programming guide.
Diffstat (limited to 'pyspark')
-rwxr-xr-x pyspark 32
1 files changed, 32 insertions, 0 deletions
diff --git a/pyspark b/pyspark
new file mode 100755
index 0000000000..9e89d51ba2
--- /dev/null
+++ b/pyspark
@@ -0,0 +1,32 @@
+#!/usr/bin/env bash
+
+# Figure out where the Scala framework is installed
+FWDIR="$(cd `dirname $0`; pwd)"
+
+# Export this as SPARK_HOME
+export SPARK_HOME="$FWDIR"
+
+# Load environment variables from conf/spark-env.sh, if it exists
+if [ -e $FWDIR/conf/spark-env.sh ] ; then
+ . $FWDIR/conf/spark-env.sh
+fi
+
+# Figure out which Python executable to use
+if [ -z "$PYSPARK_PYTHON" ] ; then
+ PYSPARK_PYTHON="python"
+fi
+export PYSPARK_PYTHON
+
+# Add the PySpark classes to the Python path:
+export PYTHONPATH=$SPARK_HOME/python/:$PYTHONPATH
+
+# Load the PySpark shell.py script when ./pyspark is used interactively:
+export OLD_PYTHONSTARTUP=$PYTHONSTARTUP
+export PYTHONSTARTUP=$FWDIR/python/pyspark/shell.py
+
+# Launch with `scala` by default:
+if [[ "$SPARK_LAUNCH_WITH_SCALA" != "0" ]] ; then
+ export SPARK_LAUNCH_WITH_SCALA=1
+fi
+
+exec "$PYSPARK_PYTHON" "$@"