#!/usr/bin/env bash

#
# Licensed to the Apache Software Foundation (ASF) under one or more
# contributor license agreements.  See the NOTICE file distributed with
# this work for additional information regarding copyright ownership.
# The ASF licenses this file to You under the Apache License, Version 2.0
# (the "License"); you may not use this file except in compliance with
# the License.  You may obtain a copy of the License at
#
#    http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#

# Go to the Spark project root directory (the parent of the directory that
# holds this script). Every expansion is quoted so a checkout path containing
# spaces works, and the script aborts if the directory cannot be entered:
# the `rm -rf` below must never run from an unexpected location.
FWDIR="$(cd "$(dirname "$0")/.." && pwd)" || exit 1
cd "$FWDIR" || exit 1

# Remove work directory
rm -rf ./work

# Choose the java launcher: the one under $JAVA_HOME when it is executable,
# otherwise whatever `java` resolves to on PATH.
if [[ -x "$JAVA_HOME/bin/java" ]]; then
  java_cmd="$JAVA_HOME/bin/java"
else
  java_cmd=java
fi

#######################################
# Reduce a `java -version` banner line to "<major><minor>" digits,
# e.g. 'java version "1.8.0_25"' -> 18. Any vendor prefix is accepted as long
# as the line contains: version "<digits>[.<digits>]...
# A missing minor component is treated as 0.
# Arguments: $1 - first line of the `java -version` output
# Outputs:   the digits on stdout; nothing when no version string is found
#######################################
java_version_digits() {
  local banner_line=$1
  # Kept in a variable so the quote and the dot need no escaping inside [[ ]].
  local version_re='version "([0-9]+)(\.([0-9]+))?'
  if [[ "$banner_line" =~ $version_re ]]; then
    printf '%s%s\n' "${BASH_REMATCH[1]}" "${BASH_REMATCH[3]:-0}"
  fi
}

# `java -version` writes its banner to stderr, hence the 2>&1.
JAVA_VERSION=$(java_version_digits "$("$java_cmd" -version 2>&1 | head -n 1)")

# Compare only when a numeric version was actually extracted; an unparsable
# banner (or a missing java binary) falls through to the warning instead of
# triggering a test(1) "integer expression expected" error.
if [[ "$JAVA_VERSION" =~ ^[0-9]+$ ]] && (( 10#$JAVA_VERSION >= 18 )); then
  echo ""
else
  echo "[Warn] Java 8 tests will not run because JDK version is < 1.8."
fi

# Partial solution for SPARK-1455: on Jenkins (AMPLAB_JENKINS set), refresh the
# local master ref and look for changed directories under sql/. The Hive test
# suite is only requested when such changes exist.
if [[ "$AMPLAB_JENKINS" != "" ]]; then
  git fetch origin master:master
  # --dirstat prints "<percent> <dir>" per line; keep the dir column and
  # retain only entries that start with sql/.
  diffs=$(git diff --dirstat master | awk '{ print $2; }' | grep "^sql/")
  if [[ "$diffs" != "" ]]; then
    echo "Detected changes in SQL. Will run Hive test suite."
    # Exported so the PySpark test runner can see it as well.
    _RUN_SQL_TESTS=true
    export _RUN_SQL_TESTS
  fi
fi

# Fail fast: from here on, stop at the first failing command, and treat a
# pipeline as failed when any of its stages fails.
set -eo pipefail

# Horizontal rule printed above and below each stage title.
static_check_rule="========================================================================="

printf '%s\n' "$static_check_rule" "Running Apache RAT checks" "$static_check_rule"
dev/check-license

printf '%s\n' "$static_check_rule" "Running Scala style checks" "$static_check_rule"
dev/scalastyle

unit_test_rule="========================================================================="
printf '%s\n' "$unit_test_rule" "Running Spark unit tests" "$unit_test_rule"

# Filters stdin, dropping lines that match "info.*Resolving", "warn.*Merging"
# or "info.*Including".
drop_sbt_noise() {
  grep -v -e "info.*Resolving" -e "warn.*Merging" -e "info.*Including"
}

# When sbt hits a build file with a failure (resolution or compilation) it
# prompts for input (q, r, ... to quit or retry). Feeding it "q" on stdin keeps
# the run from blocking on that prompt.
# SPARK_HIVE=true is set for the sbt invocation only when SQL tests were
# requested via _RUN_SQL_TESTS.
if [[ -z "$_RUN_SQL_TESTS" ]]; then
  printf 'q\n\n' | sbt/sbt clean assembly test | drop_sbt_noise
else
  printf 'q\n\n' | SPARK_HIVE=true sbt/sbt clean assembly test | drop_sbt_noise
fi

# Final two stages: the PySpark test runner, then the MiMa script. Each stage
# is announced with a title framed by a horizontal rule.
final_stage_rule="========================================================================="

printf '%s\n' "$final_stage_rule" "Running PySpark tests" "$final_stage_rule"
./python/run-tests

printf '%s\n' "$final_stage_rule" "Detecting binary incompatibilites with MiMa" "$final_stage_rule"
dev/mima