-
Notifications
You must be signed in to change notification settings - Fork 2
/
Copy pathpublish.sh
executable file
·103 lines (83 loc) · 2.94 KB
/
publish.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
#!/bin/bash
#set -o errexit # abort on nonzero exitstatus
set -o nounset # abort on unbound variable
set -o pipefail # don't hide errors within pipes
# if no argument is provided, print an error message and exit
if [ $# -eq 0 ]
then
echo "No repository file supplied. Please provide the path to the csv file."
exit 1
fi
# Clean any existing files in the data directory
if [ -d "$DATA_DIR" ]; then
rm -rf "${DATA_DIR:?}"/*
fi
# Create the data directory and partition directory
PARTITION_DIR="$DATA_DIR/partitions"
mkdir -p "$PARTITION_DIR"
CSV_FILE="$DATA_DIR/$1"
cp "$1" "$DATA_DIR"
# split csv file into 10 line chunks.
# the chunks should be named `repos-{chunk}`
# the csv file will contain two columns: url and branch
# capture the first row as the header and save to var
header=$(head -n 1 "$CSV_FILE")
cd "$PARTITION_DIR" || exit
split -l 10 "$CSV_FILE" repos-
# ensure each chunk has the header row
for file in repos-*
do
if [ "$(head -n 1 "$file")" != "$header" ]; then
echo "$header" | cat - "$file" > temp && mv temp "$file"
fi
done
# counter init to 0
index=0
function build_and_upload_repos() {
# for each chunk, read the contents of the csv file
for file in repos-*
do
if [ "$(head -n 1 "$file")" != "$header" ]; then
# prepend header to the file
echo "$header" | cat - "$file" > temp && mv temp "$file"
fi
# extract just the partition name from the file name
partition_name=$(echo "$file" | cut -d'-' -f2)
# if cloning failed, skip the rest of the loop
if ! mod git clone csv "$partition_name" "$file" --filter=tree:0; then
printf "[%d][%s] Cloning failed, skipping partition\n" $index "$partition_name"
continue
fi
mod build "./$partition_name" --no-download
mod publish "./$partition_name"
mod log builds add "./$partition_name" log.zip --last-build
# if directory exists, remove it
if [ -d "./$partition_name" ]; then
rm -rf "./$partition_name"
fi
done
# if PUBLISH_USER and PUBLISH_PASSWORD and PUBLISH_UR, or PUBLISH_TOKEN are set, publish logs
if [ "$PUBLISH_URL" ]; then
log_version=$(date '+%Y%m%d%H%M%S')
if [ "$PUBLISH_USER" ] && [ "$PUBLISH_PASSWORD" ]; then
curl --insecure -u "$PUBLISH_USER":"$PUBLISH_PASSWORD" -X PUT \
"$PUBLISH_URL/$log_version/ingest-log-$log_version.zip" \
-T log.zip
elif [ "$PUBLISH_TOKEN" ]; then
curl --insecure --header "Authorization: Bearer $PUBLISH_TOKEN" -X PUT \
"$PUBLISH_URL/$log_version/ingest-log-$log_version.zip" \
-T log.zip
else
printf "[%d] No log publishing credentials for %s provided\n" $index $PUBLISH_URL
fi
else
printf "[%d] No log publishing credentials or URL provided\n" $index
fi
# increment index
index=$((index+1))
}
# Continuously build and upload repositories in a loop
# If you'd like to run this script once, or on a schedule, remove the while loop
while true; do
build_and_upload_repos
done