From 8442115e7c22f3a34ad1ffe9e4f89da1770f66e8 Mon Sep 17 00:00:00 2001 From: Benjamin Admin Date: Thu, 12 Mar 2026 16:44:15 +0100 Subject: [PATCH] fix(rag): Fix bash compatibility + missing mkdir in phase functions MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit - Replace ${var,,} (bash 4+) with $(echo | tr) for macOS bash 3.2 compat - Add mkdir -p to phase_gesetze, phase_eu, phase_templates, phase_datenschutz, phase_dach — prevents download failures when running phases individually Co-Authored-By: Claude Opus 4.6 --- scripts/ingest-legal-corpus.sh | 9 +++++++-- 1 file changed, 7 insertions(+), 2 deletions(-) diff --git a/scripts/ingest-legal-corpus.sh b/scripts/ingest-legal-corpus.sh index 9bd8271..ac7b84f 100755 --- a/scripts/ingest-legal-corpus.sh +++ b/scripts/ingest-legal-corpus.sh @@ -448,6 +448,7 @@ phase_gesetze() { log "==========================================" log "PHASE B: Deutsche Gesetze → bp_compliance_gesetze" log "==========================================" + mkdir -p "$WORK_DIR"/{pdfs,texts} local col="bp_compliance_gesetze" local before @@ -502,6 +503,7 @@ phase_eu() { log "==========================================" log "PHASE C: EU-Rechtstexte → bp_compliance_ce" log "==========================================" + mkdir -p "$WORK_DIR"/{pdfs,texts} local col="bp_compliance_ce" local before @@ -532,6 +534,7 @@ phase_templates() { log "==========================================" log "PHASE D: Templates → bp_legal_templates" log "==========================================" + mkdir -p "$WORK_DIR"/{pdfs,texts,repos} local col="bp_legal_templates" local before @@ -769,6 +772,7 @@ phase_datenschutz() { log "==========================================" log "PHASE E: Datenschutz-Guidance → bp_compliance_datenschutz" log "==========================================" + mkdir -p "$WORK_DIR"/{pdfs,texts} local col="bp_compliance_datenschutz" local before @@ -864,7 +868,7 @@ phase_verbraucherschutz() { if [[ -f "$pdf_file" ]]; then upload_file "$pdf_file" "$col" "compliance" "legal_reference" "2025" \ - "{\"regulation_id\":\"${short,,}\",\"regulation_name_de\":\"$fullname ($short)\",\"category\":\"$category\",\"license\":\"public_domain_§5_UrhG\",\"source\":\"gesetze-im-internet.de\"}" \ + "{\"regulation_id\":\"$(echo "$short" | tr '[:upper:]' '[:lower:]')\",\"regulation_name_de\":\"$fullname ($short)\",\"category\":\"$category\",\"license\":\"public_domain_§5_UrhG\",\"source\":\"gesetze-im-internet.de\"}" \ "$short ($fullname)" fi done @@ -1129,7 +1133,7 @@ with open('$WORK_DIR/pdfs/EGBGB_Widerruf.txt', 'w') as f: if [[ -f "$pdf_file" ]]; then upload_file "$pdf_file" "$col" "compliance_ce" "legal_reference" "$year" \ - "{\"regulation_id\":\"${short,,}\",\"regulation_name_de\":\"$name_de\",\"regulation_name_en\":\"$name_en\",\"regulation_short\":\"$short\",\"celex\":\"$celex\",\"category\":\"$category\",\"license\":\"CC_BY_4.0\",\"source\":\"eur-lex\"}" \ + "{\"regulation_id\":\"$(echo "$short" | tr '[:upper:]' '[:lower:]')\",\"regulation_name_de\":\"$name_de\",\"regulation_name_en\":\"$name_en\",\"regulation_short\":\"$short\",\"celex\":\"$celex\",\"category\":\"$category\",\"license\":\"CC_BY_4.0\",\"source\":\"eur-lex\"}" \ "$short — $name_de" fi done @@ -1201,6 +1205,7 @@ phase_dach() { log "==========================================" log "PHASE I: DACH-Erweiterung" log "==========================================" + mkdir -p "$WORK_DIR"/{pdfs,texts} # ========================================================================= # I1: Fehlende DE-Gesetze → bp_compliance_gesetze