From 960b8e757c8ea95d7422752bc47084cddce99701 Mon Sep 17 00:00:00 2001 From: Benjamin Admin Date: Fri, 6 Mar 2026 08:35:53 +0100 Subject: [PATCH] fix(llm): qwen3.5 think:false + num_ctx 8192 in allen Chat/Draft-Routen MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Compliance Advisor, Drafting Agent und Validator haben nicht geantwortet, weil qwen3.5 standardmaessig im Thinking-Mode laeuft (interne Chain-of-Thought > 2min Timeout). Keiner der Agenten benoetigt Thinking-Mode — alle Aufgaben sind Chat/Textgenerierung/JSON-Validierung ohne tiefes Reasoning. think:false sorgt fuer direkte, schnelle Antworten. Co-Authored-By: Claude Sonnet 4.6 --- .../app/api/sdk/compliance-advisor/chat/route.ts | 2 ++ admin-compliance/app/api/sdk/drafting-engine/chat/route.ts | 2 ++ admin-compliance/app/api/sdk/drafting-engine/draft/route.ts | 6 ++++-- .../app/api/sdk/drafting-engine/validate/route.ts | 3 ++- 4 files changed, 10 insertions(+), 3 deletions(-) diff --git a/admin-compliance/app/api/sdk/compliance-advisor/chat/route.ts b/admin-compliance/app/api/sdk/compliance-advisor/chat/route.ts index 2fb92f0..695ea00 100644 --- a/admin-compliance/app/api/sdk/compliance-advisor/chat/route.ts +++ b/admin-compliance/app/api/sdk/compliance-advisor/chat/route.ts @@ -178,9 +178,11 @@ Der Nutzer hat "${countryLabel} (${validCountry})" gewaehlt. 
model: LLM_MODEL, messages, stream: true, + think: false, options: { temperature: 0.3, num_predict: 8192, + num_ctx: 8192, }, }), signal: AbortSignal.timeout(120000), diff --git a/admin-compliance/app/api/sdk/drafting-engine/chat/route.ts b/admin-compliance/app/api/sdk/drafting-engine/chat/route.ts index 3237271..04071cd 100644 --- a/admin-compliance/app/api/sdk/drafting-engine/chat/route.ts +++ b/admin-compliance/app/api/sdk/drafting-engine/chat/route.ts @@ -88,9 +88,11 @@ export async function POST(request: NextRequest) { model: LLM_MODEL, messages, stream: true, + think: false, options: { temperature: mode === 'draft' ? 0.2 : 0.3, num_predict: mode === 'draft' ? 16384 : 8192, + num_ctx: 8192, }, }), signal: AbortSignal.timeout(120000), diff --git a/admin-compliance/app/api/sdk/drafting-engine/draft/route.ts b/admin-compliance/app/api/sdk/drafting-engine/draft/route.ts index ea195df..b1293ff 100644 --- a/admin-compliance/app/api/sdk/drafting-engine/draft/route.ts +++ b/admin-compliance/app/api/sdk/drafting-engine/draft/route.ts @@ -131,7 +131,8 @@ async function handleV1Draft(body: Record): Promise