-
Notifications
You must be signed in to change notification settings - Fork 17
/
Copy pathcheck_license_source_files.sh
executable file
·255 lines (219 loc) · 7.89 KB
/
check_license_source_files.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
#!/bin/bash
# Copyright 2022 Northern.tech AS
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
if [ -n "$DEBUG_MENDERTESTING" ]; then
set -x
fi
# This regular expression can be set in the '.gitlab-ci.yml' file, and is passed
# on to the find expression used to aggregate all the files to check for license
# headers.
LICENSE_HEADERS_IGNORE_FILES_REGEXP="${LICENSE_HEADERS_IGNORE_FILES_REGEXP:-none}"
usage() {
cat <<EOF
$(basename "$0") [--ent-start-commit=COMMIT]
Checks that all licenses in Go and Python files are correct.
--ent-start-commit=COMMIT
For an Enterprise repository, specifies the earliest commit that is part
of only Enterprise (the very first commit after the fork point).
If the FIRST_ENT_COMMIT env variable is set, the script uses its value for
the --ent-start-commit parameter.
Environment variables:
LICENSE_HEADERS_IGNORE_FILES_REGEXP:
A regexp passed on to
$(find . -type f \( ! -regex ${LICENSE_HEADERS_IGNORE_FILES_REGEXP} ...
and can therefore be used to ignore files in a repository.
EOF
}
ENT_COMMIT="${FIRST_ENT_COMMIT}"
while [ -n "$1" ]; do
case "$1" in
--ent-start-commit=*)
ENT_COMMIT="${1#--ent-start-commit=}"
;;
--ent-start-commit)
shift
ENT_COMMIT="$1"
;;
--verbose)
set -x
;;
*)
echo >&2 "Unrecognized option $1"
usage
exit 1
;;
esac
shift
done
is_enterprise() {
local file="$1"
if [ -z "$ENT_COMMIT" ]; then
# If there is no Enterprise commit specified, then this isn't an
# Enterprise repository, so everything is Open Source.
return 1
fi
# Find the latest commit that is not a descendant of the Enterprise
# commit. This should be the latest Open Source commit. This doesn't change
# over the course of a run, so cache it.
if [ -z "$LATEST_OS_COMMIT" ]; then
LATEST_OS_COMMIT=$(git rev-list $ENT_COMMIT..HEAD --ancestry-path --boundary --date-order \
| grep -v $ENT_COMMIT \
| grep "^-" \
| head -n1 \
| sed -e 's/[^0-9a-f]//')
if [ -z "$LATEST_OS_COMMIT" ]; then
# Very unlikely, but this can happen if every descendant commit of
# ENT_COMMIT has no other ancestor. This can only happen if:
#
# 1) Open Source has never been merged into the repo after the fork.
#
# 2) ENT_COMMIT was pushed directly to the repo, instead of being
# merged.
#
# If so, the correct commit to set is $ENT_COMMIT~1
LATEST_OS_COMMIT=$ENT_COMMIT~1
fi
fi
# There is no commit before ENT_COMMIT, all code is enterprise
if [ "$LATEST_OS_COMMIT" = "$ENT_COMMIT" ]; then
return 0
fi
if git show $LATEST_OS_COMMIT:"$file" >& /dev/null; then
# File exists, it's Open Source.
return 1
else
# File does not exist, it's Enterprise.
return 0
fi
}
TEST_RESULT=0
strip_hashbang() {
if [[ $# -ne 1 ]]; then
echo >&2 "strip_hashbang: Missing argument"
fi
tf=$(mktemp)
local -r file="${1}"
awk '!(NR == 1 && $1 ~/^#!.*/)' "${file}" > "${tf}"
echo "${tf}"
}
check_file() {
local file="$1"
local license
local lines
local lic_type
local -r CM="$2"
local rc
local -r tab=$'\t'
cat > license-os.tmp <<-EOF
${CM} Licensed under the Apache License, Version 2.0 (the "License");
${CM} you may not use this file except in compliance with the License.
${CM} You may obtain a copy of the License at
${CM}
${CM} http://www.apache.org/licenses/LICENSE-2.0
${CM}
${CM} Unless required by applicable law or agreed to in writing, software
${CM} distributed under the License is distributed on an "AS IS" BASIS,
${CM} WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
${CM} See the License for the specific language governing permissions and
${CM} limitations under the License.
EOF
LINES_OS=$(cat license-os.tmp | wc -l)
# we need to add two extra lines missing from the license preamble
# // Copyright <copyright_year> Northern.tech AS
# //
LINES_OS=$(($LINES_OS + 2))
cat > license-ent.tmp <<-EOF
${CM} All Rights Reserved
EOF
LINES_ENT=$(cat license-ent.tmp | wc -l)
# we need to add two extra lines missing from the license preamble
# // Copyright <copyright_year> Northern.tech AS
# //
LINES_ENT=$(($LINES_ENT + 2))
if is_enterprise ${file}; then
license="license-ent.tmp"
lines=$LINES_ENT
lic_type="Enterprise"
else
license="license-os.tmp"
lines=$LINES_OS
lic_type="Open Source"
fi
added_year=$(git log --follow --format=%ad --date=format:%Y --diff-filter=A -- "$file" | sort -n | tail -n 1)
orig_file="${file}"
file=$(strip_hashbang "${file}")
head -n $lines "$file" | tail -n +3 | diff -u "$license" - > /dev/null
rc=$?
if [[ $rc -ne 0 ]]; then
head -n $lines "$file" | sed -e "s/${tab}/ /g" | tail -n +3 | diff -u "$license" - > /dev/null
rc=$?
fi
if [ $rc -ne 0 ]; then
echo >&2 "!!! FAILED license check on ${orig_file}. Expected this $lic_type license:"
cat "$license" >&2
TEST_RESULT=1
else
copyright_year=$(grep -oP "${CM} Copyright \d{4} Northern.tech AS" "$file" | grep -oP "\d{4}")
if [ $copyright_year -ge $added_year ]; then
# Success!
:
else
echo >&2 "!!! FAILED license check on ${orig_file}; make sure copyright year is at least the year the file was first added to git ($added_year)"
TEST_RESULT=1
fi
fi
return ${TEST_RESULT}
}
check_files() {
if [[ ! $# -ge 1 ]]; then
echo >&2 "check_files requires one or more parameters"
fi
local -r SOURCE_FILES="$@"
for source_file in ${SOURCE_FILES}; do
case ${source_file} in
*.go|*.[ch]|*.[ch]pp)
CM='//'
;;
*.py|*.sh)
CM="#"
;;
*)
echo >&2 "No source file testing done for file:\n\t ${source_file}\nThe filetype is unsupported type"
TEST_RESULT=1
continue
;;
esac
check_file "${source_file}" "${CM}"
done
rm -f license-os.tmp license-ent.tmp
}
echo >&2 "LICENSE_HEADERS_IGNORE_FILES_REGEXP: ${LICENSE_HEADERS_IGNORE_FILES_REGEXP}"
echo >&2 "Checking licenses on all Go files"
GO_FILES="\
$(find . -type f ! -regex "${LICENSE_HEADERS_IGNORE_FILES_REGEXP}" ! -path '*/vendor/*' -name '*.go')
"
check_files "${GO_FILES}"
echo >&2 "Checking licenses on all Python files"
PYTHON_FILES="\
$(find . -type f ! -regex "${LICENSE_HEADERS_IGNORE_FILES_REGEXP}" ! -path '*/vendor/*' ! -regex '.*\.venv.*' ! -regex '.*build/.*' -name '*.py')"
check_files "${PYTHON_FILES}"
echo >&2 "Checking licenses on all Shell files"
SHELL_FILES="\
$(find . -type f ! -regex "${LICENSE_HEADERS_IGNORE_FILES_REGEXP}" ! -path '*/vendor/*' -name '*.sh')"
check_files "${SHELL_FILES}"
echo >&2 "Checking licenses on all C/C++ files"
C_FILES="\
$(find . -type f ! -regex "${LICENSE_HEADERS_IGNORE_FILES_REGEXP}" ! -path '*/vendor/*' \( -name '*.[ch]' -o -name '*.[ch]pp' \))"
check_files "${C_FILES}"
exit ${TEST_RESULT}