6
0
Fork 0
This repository has been archived on 2024-10-15. You can view files and clone it, but cannot push or open issues or pull requests.
fediversity_website_archive/scripts/check-all-links.sh

47 lines
1.4 KiB
Bash
Raw Normal View History

#!/bin/sh
set -eu
if [ -f ./check-all-links.tmp ]; then rm ./check-all-links.tmp; fi
2023-07-01 11:34:27 +02:00
if [ -d ./public ]; then
2023-07-01 11:34:27 +02:00
# Recursief zoeken, case-insentive, alleen de woorden die matchen, bestandsnaam niet tonen
# Alleen de items tonen die starten met http
# Strip items die eindigen met een \ (o.a. uit feed.json)
# Strip items die eindigen met een \n en aanvullende tekst (b.v. in abstracts)
# Negeer items van GitHub/Schema.org
# Sorten en uniek maken van de lijst
grep -ri --only-matching --no-filename "https://[a-zA-Z0-9]*\.\([a-z0-9\.\_/~-]\)*" ./public \
| grep "^http" \
| sed 's/\\$//' \
| sed 's/\\n.*$//' \
| grep -v 'https://github.com/NLUUG/website' \
| grep -v 'https://schema.org' \
| sort --unique > check-all-links.tmp
# URL's testen
if [ -f ./check-all-links.tmp ]; then
for URL in $(cat ./check-all-links.tmp); do
HTTP_CODE=$(curl -s -o /dev/null -w "%{http_code}" "${URL}")
if [ ! "${HTTP_CODE}" = "200" ]; then
echo "[WARNING] ${URL} (HTTP: ${HTTP_CODE})"
fi
sleep 2
done
else
echo "Kan bestand met links niet vinden."
exit 1
fi
else
echo "Dit script dient gedraaid te worden in de hoofddirectory van de website."
exit 1
fi
if [ -f ./check-all-links.tmp ]; then rm ./check-all-links.tmp; fi
exit 0
# EOF