diff --git a/admin-compliance/app/api/sdk/compliance-advisor/chat/route.ts b/admin-compliance/app/api/sdk/compliance-advisor/chat/route.ts index 695ea00b..37b5c5ed 100644 --- a/admin-compliance/app/api/sdk/compliance-advisor/chat/route.ts +++ b/admin-compliance/app/api/sdk/compliance-advisor/chat/route.ts @@ -179,6 +179,9 @@ Der Nutzer hat "${countryLabel} (${validCountry})" gewaehlt. messages, stream: true, think: false, + // Modell im VRAM halten → kein Kaltstart bei der naechsten Frage + // (Kaltstart eines 35b-Modells war die Ursache fuer "Load failed"). + keep_alive: '30m', options: { temperature: 0.3, num_predict: 8192,