From fde2f551d787ef9b29e483e25058b53f39bad567 Mon Sep 17 00:00:00 2001 From: Benjamin Admin Date: Mon, 11 May 2026 14:43:47 +0200 Subject: [PATCH] fix: Add impressum keywords to dsi_discovery.py inline DSI_KEYWORDS The inline DSI_KEYWORDS in dsi_discovery.py was missing 'impressum'. This caused self-extraction to skip impressum pages, returning datenschutz text instead. Added: impressum, anbieterkennzeichnung, imprint, legal notice, site notice. Co-Authored-By: Claude Opus 4.6 (1M context) --- consent-tester/services/dsi_discovery.py | 4 ++++ 1 file changed, 4 insertions(+) diff --git a/consent-tester/services/dsi_discovery.py b/consent-tester/services/dsi_discovery.py index e5aa4d0..924a231 100644 --- a/consent-tester/services/dsi_discovery.py +++ b/consent-tester/services/dsi_discovery.py @@ -44,6 +44,10 @@ DSI_KEYWORDS: dict[str, list[str]] = { "widerruf", "rücktrittsrecht", # Cookie "cookie-richtlinie", "cookie-policy", "cookie-hinweis", + # Impressum + "impressum", "anbieterkennzeichnung", + # Imprint (EN) + "imprint", "legal notice", "site notice", ], "en": [ "privacy policy", "privacy notice", "data protection", "data policy",