#!/usr/bin/env bash
#
# Report pages listed in the public sitemap that a local copy of the site
# does not serve successfully.
#
# Steps:
#   1. Download the sitemap of training.galaxyproject.org and extract every
#      <loc> URL with the `xpath` command-line tool.
#   2. Drop URLs under /training-material/api/, URLs ending in .yml/.yaml and
#      URLs ending in slides-plain.html.
#   3. Rewrite the remaining URLs to point at http://localhost:4002 and store
#      them in the URL list file.
#   4. Request each rewritten URL and print (to stdout, one per line) every
#      URL whose HTTP status code is not exactly 200.
#
# Environment:
#   URLS_FILE  Path of the intermediate URL list (default: /tmp/urls).
#
# Requires: bash, curl, xpath, grep, sed.

# Keep the historical location as the default so anything that inspects
# /tmp/urls afterwards keeps working; allow callers to pick a safer path.
urls_file=${URLS_FILE:-/tmp/urls}

# -f: treat HTTP errors as failures instead of parsing an error page.
# -sS: no progress meter, but still show real errors.
# -L: follow redirects (e.g. http -> https) to reach the actual sitemap.
curl -fsSL training.galaxyproject.org/sitemap.xml \
  | xpath -q -e '//url/loc/text()' \
  | grep -v '/training-material/api/' \
  | grep -E -v '\.ya?ml$' \
  | grep -v 'slides-plain.html$' \
  | sed 's|https://training\.galaxyproject\.org|http://localhost:4002|' \
  > "$urls_file"

# Read line by line instead of word-splitting `cat` output, so URLs are never
# subject to pathname expansion; the `|| [[ -n ... ]]` clause also handles a
# final line without a trailing newline.
while IFS= read -r url || [[ -n "$url" ]]; do
  # Skip blank lines rather than issuing a request with an empty URL.
  [[ -n "$url" ]] || continue

  # Only the status code is needed; the body is discarded. stdin is detached
  # so the request can never consume the URL list feeding this loop.
  resp=$(curl -s -o /dev/null -w '%{http_code}' "$url" < /dev/null)

  # Compare as a string: curl reports 000 when no response was received, and
  # an arithmetic test would break on empty or non-numeric output.
  if [[ "$resp" != "200" ]]; then
    printf '%s\n' "$url"
  fi
done < "$urls_file"