From 8bd2368084eacaba1e35cc2e50bfd75f0736e44b Mon Sep 17 00:00:00 2001 From: Felix Lohmeier Date: Thu, 5 Jan 2017 18:01:09 +0100 Subject: [PATCH] Korrektur count-tsv Script --- scripte/count-tsv.sh | 12 +++--------- 1 file changed, 3 insertions(+), 9 deletions(-) diff --git a/scripte/count-tsv.sh b/scripte/count-tsv.sh index ca4a179..8dae673 100755 --- a/scripte/count-tsv.sh +++ b/scripte/count-tsv.sh @@ -10,26 +10,20 @@ if [ -z "$1" ] echo "Beispiel: ./count-tsv.sh file.tsv" exit else - echo "Folgende Dateien werden untersucht:" files=($*) - printf '%s\n' "${files[@]}" + printf '%s\n' MARC-Feld Vorkommen Mehrfachbelegung | paste -sd '\t' fi # Schleife für mehrere Dateien for file in "${files[@]}"; do - echo "" - echo $file - echo "" - printf '%-30s\t%-10s\t%-10s \n' "SPALTENNAME" "ZEILEN" "ZEILEN-MIT-␟" - # Spaltennamen erfassen - readarray columns < <(head -q -n1 ${file} | tr '\t' '\n' | cat) + readarray columns -t < <(head -q -n1 ${file} | tr -d ' ' | tr '\t' '\n' | cat) # Belegte Zellen in Spalten zählen und ausgeben number=1 for column in "${columns[@]}"; do - printf '%-30s\t%-10d\t%-10d \n' "${column}" $(cut -d$'\t' -f ${number} ${file} | grep -v '^$' | wc -l) $(cut -d$'\t' -f ${number} ${file} | grep '␟' | wc -l) + printf '%s\n' ${column} $(cut -d$'\t' -f ${number} ${file} | grep -v '^$' | wc -l) $(cut -d$'\t' -f ${number} ${file} | grep '␟' | wc -l) | paste -sd '\t' number=$(($number+1)) done done