From 3b154c21cbd3a196d734196c0d60cce196530cea Mon Sep 17 00:00:00 2001 From: Felix Lohmeier Date: Tue, 2 Mar 2021 14:59:24 +0100 Subject: [PATCH] =?UTF-8?q?fix=20#27=20M=C3=BCnster:=20Linkcheck=20soll=20?= =?UTF-8?q?weitere=20Informationen=20ausgeben?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- Taskfile.yml | 13 +++++++------ 1 file changed, 7 insertions(+), 6 deletions(-) diff --git a/Taskfile.yml b/Taskfile.yml index 63dea3a..34a7327 100644 --- a/Taskfile.yml +++ b/Taskfile.yml @@ -168,14 +168,15 @@ tasks: cmds: - test -n "{{.PROJECT}}" # Links extrahieren - - xmllint --xpath '//@*[local-name(.) = "href"]' split/*.xml | cut -d '"' -f2 | sort | uniq > links.txt - # http status code aller Links ermitteln - - awk '{ print "url = " $0 "\noutput = /dev/null"; }' links.txt > curl.cfg - - curl --silent --head --location --write-out "%{http_code} %{url_effective}\n" --config curl.cfg > linkcheck.log + - grep -o 'href="[^"]*"' split/*.xml | sed 's/:href=/\t/' | tr -d '"' | sort -k 2 --unique > links.txt + # http status code ermitteln + - awk '{ print "url = " $2 "\noutput = /dev/null"; }' links.txt > curl.cfg + - curl --silent --head --location --write-out "%{http_code}\t%{url_effective}\n" --config curl.cfg > curl.log + # Tabelle mit status code, effektiver URL, Dateiname und start URL erstellen + - paste curl.log links.txt > linkcheck.log + - rm -rf curl.cfg curl.log links.txt # Logdatei auf status code != 2XX prüfen - if grep '^[^2]' linkcheck.log; then echo 1>&2 "Logdatei $PWD/linkcheck.log enthält problematische status codes!" && exit 1; fi - # Aufräumen bei Erfolg - - rm -rf curl.cfg links.txt sources: - split/*.xml generates: