aboutsummaryrefslogtreecommitdiff
path: root/dev/tests/pr_public_classes.sh
blob: 41c5d3ee8cb3c813525fbad42030e466c3bc0b45 (plain) (blame)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
#!/usr/bin/env bash

#
# Licensed to the Apache Software Foundation (ASF) under one or more
# contributor license agreements.  See the NOTICE file distributed with
# this work for additional information regarding copyright ownership.
# The ASF licenses this file to You under the Apache License, Version 2.0
# (the "License"); you may not use this file except in compliance with
# the License.  You may obtain a copy of the License at
#
#    http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#

#
# This script follows the base format for testing pull requests against
# another branch and returning results to be published. More details can be
# found at dev/run-tests-jenkins.
#
# Arg1: The Github Pull Request Actual Commit
#+ known as `ghprbActualCommit` in `run-tests-jenkins`

ghprbActualCommit="$1"

# $ghprbActualCommit is an automatic merge commit generated by GitHub; its parents are some Spark
# master commit and the tip of the pull request branch.

# By diffing$ghprbActualCommit^...$ghprbActualCommit and filtering to examine the diffs of only
# non-test files, we can gets us changes introduced in the PR and not anything else added to master
# since the PR was branched.

# Handle differences between GNU and BSD sed
if [[ $(uname) == "Darwin" ]]; then
    SED='sed -E'
else
    SED='sed -r'
fi

source_files=$(
  git diff $ghprbActualCommit^...$ghprbActualCommit --name-only  `# diff patch against master from branch point` \
    | grep -v -e "\/test"                               `# ignore files in test directories` \
    | grep -e "\.py$" -e "\.java$" -e "\.scala$"        `# include only code files` \
    | tr "\n" " "
)

new_public_classes=$(
  git diff $ghprbActualCommit^...$ghprbActualCommit ${source_files}      `# diff patch against master from branch point` \
    | grep "^\+"                              `# filter in only added lines` \
    | $SED -e "s/^\+//g"                      `# remove the leading +` \
    | grep -e "trait " -e "class "            `# filter in lines with these key words` \
    | grep -e "{" -e "("                      `# filter in lines with these key words, too` \
    | grep -v -e "\@\@" -e "private"          `# exclude lines with these words` \
    | grep -v -e "^// " -e "^/\*" -e "^ \* "  `# exclude comment lines` \
    | $SED -e "s/\{.*//g"                     `# remove from the { onwards` \
    | $SED -e "s/\}//g"                       `# just in case, remove }; they mess the JSON` \
    | $SED -e "s/\"/\\\\\"/g"                 `# escape double quotes; they mess the JSON` \
    | $SED -e "s/^(.*)$/\`\1\`/g"             `# surround with backticks for style` \
    | $SED -e "s/^/  \* /g"                   `# prepend '  *' to start of line` \
    | $SED -e "s/$/\\\n/g"                    `# append newline to end of line` \
    | tr -d "\n"                              `# remove actual LF characters`
)

if [ -z "$new_public_classes" ]; then
  echo " * This patch adds no public classes."
else
  public_classes_note=" * This patch adds the following public classes _(experimental)_:"
  echo -e "${public_classes_note}\n${new_public_classes}"
fi