diff --git a/scripts/auto-ingest-protocols.sh b/scripts/auto-ingest-protocols.sh index d672156..745d33f 100755 --- a/scripts/auto-ingest-protocols.sh +++ b/scripts/auto-ingest-protocols.sh @@ -33,6 +33,68 @@ PROTO_TARGETS=( echo "=== auto-ingest-protocols $(date -Iseconds) ===" +# ─── HH: Index-Page-Scrape statt URL-Pattern ────────────────────────── +# Hamburg hat keine vorhersagbare URL-Pattern (Blob-IDs + Hashes). +# Stattdessen: Index-Seite scrapen, jedes gefundene PDF einzeln ingesten. +echo "--- HH WP23 (Index-Scrape) ---" +docker exec "$CONTAINER" python <