From 99b0d05b69515aedb3a00184c59fe37444ab5085 Mon Sep 17 00:00:00 2001
From: Andreas Romeyke <andreas.romeyke@slub-dresden.de>
Date: Fri, 19 Apr 2024 17:28:16 +0200
Subject: [PATCH] - init

---
 analysis/LIESMICH.txt                         |  5 +++
 ...e_lzaid_dubletten_exkl_gel\303\266scht.sh" | 43 +++++++++++++++++++++
 2 files changed, 48 insertions(+)
 create mode 100644 analysis/LIESMICH.txt
 create mode 100644 "analysis/finde_lzaid_dubletten_exkl_gel\303\266scht.sh"

diff --git a/analysis/LIESMICH.txt b/analysis/LIESMICH.txt
new file mode 100644
index 0000000..5094249
--- /dev/null
+++ b/analysis/LIESMICH.txt
@@ -0,0 +1,5 @@
+Das Script 'finde_lzaid_dubletten.sh' ist um mehrere Größenordnungen (im ms
+Bereich) schneller
+als 'bash analysis/finde_lzaid_dubletten_exkl_gelöscht.sh' (im s Bereich)
+
+
diff --git "a/analysis/finde_lzaid_dubletten_exkl_gel\303\266scht.sh" "b/analysis/finde_lzaid_dubletten_exkl_gel\303\266scht.sh"
new file mode 100644
index 0000000..331a09f
--- /dev/null
+++ "b/analysis/finde_lzaid_dubletten_exkl_gel\303\266scht.sh"
@@ -0,0 +1,43 @@
+#!/bin/bash
+#
+# List every aip row whose id is not listed in table 'deleted' and whose lza_id
+# is shared by more than one ie_id, ordered by lza_id.
+#
+# Usage: bash analysis/finde_lzaid_dubletten_exkl_gelöscht.sh <sqlite-database>
+#
+# NOTE(review): rows listed in 'deleted' are only removed from the output; they
+# still count when deciding whether an lza_id has several ie_ids. Confirm that
+# this is the intent.
+#
+# NOTE(review): the timing comparison in LIESMICH.txt may not describe this
+# form of the query - re-measure before relying on it.
+
+if [ "$#" -lt 1 ]; then
+    echo "usage: $0 <sqlite-database>" >&2
+    exit 2
+fi
+
+sql1=$(cat <<'SQL1'
+SELECT ie_id, lza_id, version, dir_path
+FROM aip
+-- The deleted filter reads aip.id of the row being listed, so it lives on the
+-- outer query; the duplicate search below does not depend on the current row.
+WHERE aip.id NOT IN (
+    SELECT aip_id FROM deleted
+)
+AND lza_id IN (
+    SELECT lza_id
+    FROM (
+        -- one row per (ie_id, lza_id) pair, however many versions exist
+        SELECT ie_id, lza_id
+        FROM aip
+        GROUP BY ie_id, lza_id
+    )
+    GROUP BY lza_id
+    HAVING COUNT(*) > 1
+)
+ORDER BY lza_id
+SQL1
+)
+
+echo "${sql1}" | sqlite3 "$1"
-- 
GitLab