From 756d068b4f8f3524f197ec13bccdc03b6e3e62a9 Mon Sep 17 00:00:00 2001 From: Benjamin Admin Date: Mon, 13 Apr 2026 12:26:01 +0200 Subject: [PATCH] =?UTF-8?q?fix:=20skip=5Fweb=5Fsearch=20Default=20auf=20Tr?= =?UTF-8?q?ue=20=E2=80=94=205x=20schnellere=20Pipeline?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Anchor-Search (DuckDuckGo + RAG via SDK) verlangsamt Pipeline von ~50 Chunks/min auf ~10 Chunks/min. Anchors (OWASP/NIST-Referenzen) koennen nachtraeglich in einem Batch-Job befuellt werden. Co-Authored-By: Claude Opus 4.6 (1M context) --- control-pipeline/api/control_generator_routes.py | 2 +- control-pipeline/services/control_generator.py | 2 +- 2 files changed, 2 insertions(+), 2 deletions(-) diff --git a/control-pipeline/api/control_generator_routes.py b/control-pipeline/api/control_generator_routes.py index 0d95fcf..3a10dd4 100644 --- a/control-pipeline/api/control_generator_routes.py +++ b/control-pipeline/api/control_generator_routes.py @@ -52,7 +52,7 @@ class GenerateRequest(BaseModel): max_controls: int = 50 max_chunks: int = 1000 # Default: process max 1000 chunks per job (respects document boundaries) batch_size: int = 5 - skip_web_search: bool = False + skip_web_search: bool = True # Default True — Anchors nachtraeglich batchen dry_run: bool = False regulation_filter: Optional[List[str]] = None # Only process these regulation_code prefixes regulation_exclude: Optional[List[str]] = None # Skip these regulation_code prefixes diff --git a/control-pipeline/services/control_generator.py b/control-pipeline/services/control_generator.py index a05dacc..f1ac8d1 100644 --- a/control-pipeline/services/control_generator.py +++ b/control-pipeline/services/control_generator.py @@ -489,7 +489,7 @@ class GeneratorConfig(BaseModel): max_controls: int = 0 # 0 = unlimited (process ALL chunks) max_chunks: int = 0 # 0 = unlimited; >0 = stop after N chunks (respects document boundaries) skip_processed: bool = True - skip_web_search: bool = False + skip_web_search: bool = True # Default True — Anchor-Search verlangsamt 5x, nachtraeglich batchen dry_run: bool = False existing_job_id: Optional[str] = None # If set, reuse this job instead of creating a new one regulation_filter: Optional[List[str]] = None # Only process chunks matching these regulation_code prefixes