gentoo-asahi-releng/scripts/copy_buildsync.sh

352 lines
9.5 KiB
Bash
Raw Normal View History

2012-07-09 17:47:42 +00:00
#!/bin/bash
# Where artifacts are uploaded by builders.
INCOMING_BASE="/release/weekly/builds"
# Where artifacts are moved to so they can be uploaded to mirrors.
OUTGOING_BASE="/release/distfiles/weekly"
# Scratch space used when moving files from incoming to outgoing.
TMPDIR_BASE="/release/distfiles/tmp/buildsync/partial"
# Keep some records
LOGDIR_BASE="/release/distfiles/tmp/buildsync/logs"
ARCHES=(
alpha
amd64
arm
arm64
hppa
ia64
loong
mips
m68k
ppc
riscv
s390
sh
sparc
x86
)
RSYNC_OPTS=(
-aO
--delay-updates
)
# Command line for `find` to figure out what files are release artifacts.
EXTENSIONS=(
'('
-name '*.tar.xz' -o
-name '*.tar.bz2' -o
-name '*.tar.gz' -o
-name '*.tar' -o
-name '*.sfs'
')'
)
2012-07-09 17:47:42 +00:00
OUT_STAGE3="latest-stage3.txt"
OUT_ISO="latest-iso.txt"
# Nothing to edit beyond this point
DEBUGP=
VERBOSEP=
usage() {
cat <<EOF
Usage: $0 [options]
Move releases from the incoming upload directory to the outgoing release
directory so they can be pushed out to mirrors.
Also update the "latest" links/files so people can easily find the current
version for any particular arch/release.
Options:
-v, --verbose Run in verbose mode
-d, --debug Run in debug mode
EOF
exit "${1:-1}"
}
# Copy artifacts for an arch to the outgoing directory.
copy_arch_to_outgoing() {
local ARCH=$1 indir=$2 outdir=$3 tmpdir=$4 logdir=$5
local i t rc timestamps
if [[ ! -d ${indir} ]]; then
# Nothing to do for this arch.
return
fi
# Copying
timestamps=( $(
find "${indir}" \
-regextype posix-egrep \
-type f \
-regex '.*-20[0123][0-9]{5}(([0-9]{6})|(T[0-9]{6}Z))?.*' \
\( -not -path '*/\.*' \) \
| sed -e 's:^.*-\(20[^.]\+\).*$:\1:' \
| sort -ur
) )
for i in "${timestamps[@]}" ; do
#echo "Doing $i"
t="${outdir}/${i}"
mkdir -p "${t}" 2>/dev/null
rsync \
"${RSYNC_OPTS[@]}" \
--temp-dir="${tmpdir}" \
--partial-dir="${tmpdir}" \
--log-file="${logdir}/rsync.log" \
--filter '- **/.*' \
--filter "S *${i}*" \
--filter 'S **/' \
--filter 'H *' \
"${indir}"/ \
"${t}"
rc=$?
if [ $rc -eq 0 ]; then
find "${indir}" \
-type f \
-name "*${i}*" \
\( -not -path '*/\.*' \) \
-print0 \
| xargs -0 --no-run-if-empty \
$DEBUGP rm $VERBOSEP -f
else
echo "Not deleting ${indir}/*${i}*, rsync failed!" 1>&2
fail=1
fi
done
find "${outdir}" \
-depth \
-mindepth 1 \
-type d \
-exec rmdir --ignore-fail-on-non-empty {} +
}
process_arch() {
local ARCH=$1
2012-07-09 17:47:42 +00:00
fail=0
indir="${INCOMING_BASE}/${ARCH}"
outdir="${OUTGOING_BASE}/${ARCH}"
tmpdir="${TMPDIR_BASE}/${ARCH}"
logdir="${LOGDIR_BASE}/${ARCH}"
2012-07-09 17:47:42 +00:00
mkdir -p "${tmpdir}" "${logdir}" 2>/dev/null
# Sync incoming->outgoing first.
copy_arch_to_outgoing "${ARCH}" "${indir}" "${outdir}" "${tmpdir}" "${logdir}"
2012-07-09 17:47:42 +00:00
# ================================================================
# Build data for revealing latest:
# *.iso
# stage3*bz2
cd "${outdir}"
# %T@
iso_list="$(find 20* -name '*.iso' -printf '%h %f %h/%f\n' 2>/dev/null |grep -v hardened | sort -n)"
stage3_list=$(find 20* -name "stage3*" -a "${EXTENSIONS[@]}" -printf '%h %f %h/%f\n' 2>/dev/null| grep -v hardened | sort -n)
2012-07-09 17:47:42 +00:00
latest_iso_date="$(echo -e "${iso_list}" |awk '{print $1}' |cut -d/ -f1 | tail -n1)"
latest_stage3_date="$(echo -e "${stage3_list}" |awk '{print $1}' |cut -d/ -f1 | tail -n1)"
header="$(echo -e "# Latest as of $(date -uR)\n# ts=$(date -u +%s)")"
2013-04-18 08:04:50 +00:00
2012-07-09 17:47:42 +00:00
# Do not remove this
[ -z "${latest_iso_date}" ] && latest_iso_date="NONE-FOUND"
[ -z "${latest_stage3_date}" ] && latest_stage3_date="NONE-FOUND"
2013-04-18 08:04:50 +00:00
OUT_ISO_tmp=""
OUT_STAGE3_tmp=""
2012-07-09 17:47:42 +00:00
if [ -n "${iso_list}" ]; then
OUT_ISO_tmp=$(mktemp -p . -t ".${OUT_ISO}.XXXXXX")
chmod 644 "${OUT_ISO_tmp}"
echo -e "${header}" >"${OUT_ISO_tmp}"
# Some arches produce more than one type of iso.
# So let's not advertise a current one via a symlink in general.
rm -f current-iso
2012-07-09 17:47:42 +00:00
fi
if [ -n "${stage3_list}" ]; then
OUT_STAGE3_tmp=$(mktemp -p . -t ".${OUT_STAGE3}.XXXXXX")
chmod 644 "${OUT_STAGE3_tmp}"
echo -e "${header}" >"${OUT_STAGE3_tmp}"
# Ditto for stage3
rm -f current-stage3
2012-07-09 17:47:42 +00:00
fi
2013-04-18 08:04:50 +00:00
# New variant preserve code
find_variants=( '(' -iname '*.iso' -o -name 'netboot-*' -o "${EXTENSIONS[@]}" ')' )
variants=$(find 20* "${find_variants[@]}" -printf '%f\n' 2>/dev/null | sed -e 's,-20[012][0-9]\{5\}.*,,g' -r | sort -u)
# This file specifies which variants are still in use.
keepfile="${tmpdir}/.keep.${ARCH}.txt"
keepfile_tmp=$(mktemp -p "${tmpdir}" -t ".keep.${ARCH}.txt.XXXXXX")
echo -n '' >"${keepfile_tmp}"
chmod 644 "${keepfile_tmp}"
2013-04-18 08:04:50 +00:00
for v in $variants ; do
# FIXME: trace the $a variable in this!
# example output 20230907T160230Z/install-alpha-minimal-20230907T160230Z.iso
variant_path=$(find 20* -iname "${v}-20*" "${find_variants[@]}" -print 2>/dev/null | sed -e "s,.*/$a/autobuilds/,,g" | sort -k1,1 -t/ | tail -n1 )
if [ -z "${variant_path}" ] || [ ! -e "${variant_path}" ]; then
echo "$ARCH: Variant ${v} is missing" 1>&2
continue
fi
variant_date="${variant_path%/*}"
variant_base="${variant_path#*/}"
size=$(stat --format='%s' "${variant_path}")
2012-07-09 17:47:42 +00:00
f="latest-${v}.txt"
f_tmp=$(mktemp -p . -t ".${f}.XXXXXX")
chmod 644 "${f_tmp}"
echo -e "${header}" >"${f_tmp}"
echo -e "${variant_path} ${size}" >>"${f_tmp}"
[[ ${variant_path} =~ tar.*$ ]] && echo -e "${variant_path} ${size}" >>"${OUT_STAGE3_tmp}"
[[ ${variant_path} =~ iso$ ]] && echo -e "${variant_path} ${size}" >>"${OUT_ISO_tmp}"
# Previously, current-${v}/ was a symlink to the timestamp directory.
# This was apparently confusing to some users because it had way too many files.
# So instead make current-${v}/ a directory, containing just symlinks to
# the selected build.
#
# Link the files for a given variant into a current-${v}/ directory.
# If it's an old link, remove to convert to directory.
if test -L "current-$v" ; then rm "current-$v" ; fi
# If there is a file here, something went wrong.
if ! mkdir -p "current-$v" ; then
echo "$ARCH: could not mkdir current-${v}" 1>&2
continue
fi
# Remove old links in the directory.
find "current-$v" \
-type l \
! -name "$f" \
! -name "*${variant_date}*" \
-delete
# install new links
# do NOT unconditionally use -f here, we do not want to override the
# existing files. this will ensure the mtime of the links does not change
# in most cases.
(
# shellcheck disable=SC2164 # error-checked above
cd "current-$v"
for variant_file in "../${variant_path}"* ; do
doit=0
vfb=$(basename "$variant_file")
# If it doesn't exist, add it.
if [[ ! -e "$vfb" ]]; then
doit=1
else
# If it does exist, check carefully to see if anything is different
# Does it point to somewhere else?
# Is the target newer?
# If those are true, also bump the symlink.
vft=$(readlink -f "$vfb")
[[ "$vft" != "$(readlink -f "$variant_file")" ]] && doit=1
[[ "$vfb" -nt "$vft" ]] && doit=1
fi
[[ $doit -eq 1 ]] && ln -sf -t . "${variant_file}"
done
)
# Update keepfile
echo "${variant_path}" | sed -e 's,/.*,,g' -e 's,^,/,g' -e 's,$,$,g' >>"${keepfile_tmp}"
# Place latest-*txt into place in the base arch dir.
mv -f "${f_tmp}" "${f}"
# current-${variant}/latest-${variant}.txt contains the RELATIVE filename
# So we have to strip the leading directory on the path.
# reuse the tmpfile from $f
sed "s,^${variant_date}/,,g" <"${f}" >"${f_tmp}" && mv -f "${f_tmp}" "current-$v"/"${f}"
2013-04-18 08:04:50 +00:00
done
# Atomic move these files if created.
[[ -n "${OUT_ISO_tmp}" ]] && [[ -f "${OUT_ISO_tmp}" ]] && mv "${OUT_ISO_tmp}" "${OUT_ISO}"
[[ -n "${OUT_STAGE3_tmp}" ]] && [[ -f "${OUT_STAGE3_tmp}" ]] && mv "${OUT_STAGE3_tmp}" "${OUT_STAGE3}"
# Refresh keepfile
mv -f "${keepfile_tmp}" "${keepfile}"
2012-07-09 17:47:42 +00:00
# ================================================================
# Cleanup
if [ $fail -eq 0 ]; then
2012-07-09 17:47:42 +00:00
# Clean up all but latest 4 from mirror dir
cd "${outdir}"
for i in $(find . -regextype posix-basic -mindepth 1 -maxdepth 1 -type d -regex '.*20[012][0-9]\{5\}.*' \
2012-07-09 17:47:42 +00:00
| sed -e 's:^.*-\(20[^.]\+\).*$:\1:' \
| sort -ur \
| grep -E -v -e "/${latest_iso_date}\$|/${latest_stage3_date}\$" \
| grep -E -v -f "${keepfile}" \
2012-07-09 17:47:42 +00:00
| tail -n +5); do
$DEBUGP rm $VERBOSEP -rf "$(pwd)"/"${i}"
2012-07-09 17:47:42 +00:00
done
2013-04-18 08:04:50 +00:00
# Preserve the keepfile for review
cp -lf "${keepfile}" "${outdir}"
# Find the dead links for cleanup
_dead="${tmpdir}"/dead-link
find -L $(pwd) -type l >"${_dead}"
mv -f "${_dead}" "${logdir}/dead-links.txt"
# Find the dead latest txt files
_dead="${tmpdir}"/dead-latest
for f in $(find "${outdir}" -name 'latest*txt' ) ; do
d=$(dirname $f)
find $d \
| fgrep -f <(awk '/^#/{next} {print $1}' $f) \
| sed "s,${d}/,,g" \
| sort \
| comm -13 \
- \
<(sort $f |grep -v -e '^#' |awk '{print $1}') \
| fgrep -l -f - $f \
| xargs -n1 --no-run-if-empty readlink -f
done >"${_dead}"
mv -f "${_dead}" "${logdir}/dead-latest-txt.txt"
# Cleanup tmpdir
$DEBUGP rm $VERBOSEP -rf "${tmpdir}"
2012-07-09 17:47:42 +00:00
else
echo "There was some failure for $ARCH during the weekly sync. Not doing cleanup for fear of dataloss." 1>&2
echo "See logs in $logdir" 1>&2
2012-07-09 17:47:42 +00:00
fi
}
2012-07-09 17:47:42 +00:00
main() {
# Process all the command line options first.
while [[ $# -ne 0 ]]; do
case $1 in
-d|--debug)
DEBUGP="echo"
RSYNC_OPTS+=( -n )
;;
-v|--verbose)
VERBOSEP="-v"
RSYNC_OPTS+=( -v )
;;
-h|--help)
usage 0
;;
*)
usage 1
;;
esac
shift
done
# Process all the architectures.
local arch
for arch in "${ARCHES[@]}"; do
process_arch "${arch}"
done
}
main "$@"
2012-07-09 17:47:42 +00:00
# vim:ts=2 sw=2 noet ft=sh: