feat: Investor Agent — FAQ als LLM-Kontext statt Direkt-Streaming

Architektur-Umbau: FAQ-Antworten werden NICHT mehr direkt gestreamt. Stattdessen werden die Top-3 relevanten FAQ-Einträge als Kontext ans LLM übergeben. Das LLM interpretiert die Frage, kombiniert mehrere FAQs bei komplexen Fragen und antwortet natürlich. Vorher: Frage → Keyword-Match → FAQ direkt streamen (LLM umgangen) Nachher: Frage → Top-3 FAQ-Matches → LLM-Prompt als Kontext → LLM antwortet Neue Funktionen: - matchFAQMultiple(): Top-N Matches statt nur bester - buildFAQContext(): Baut Kontext-String für LLM-Injection - faqContext statt faqAnswer im Request-Body - System-Prompt Anweisung: "Kombiniere bei Bedarf, natürlicher Fließtext" Behebt: Komplexe Fragen mit 2+ Themen werden jetzt korrekt beantwortet Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>
2026-03-28 10:57:47 +01:00
parent 928556aa89
commit 34d2529e04
3 changed files with 44 additions and 54 deletions
@@ -157,42 +157,12 @@ ${JSON.stringify(features.rows, null, 2)}
 export async function POST(request: NextRequest) {
  try {
    const body = await request.json()
-    const { message, history = [], lang = 'de', slideContext, faqAnswer } = body
+    const { message, history = [], lang = 'de', slideContext, faqContext } = body

    if (!message || typeof message !== 'string') {
      return NextResponse.json({ error: 'Message is required' }, { status: 400 })
    }

-    // FAQ shortcut: if client sends a pre-cached FAQ answer, stream it directly (no LLM call)
-    if (faqAnswer && typeof faqAnswer === 'string') {
-      const encoder = new TextEncoder()
-      const stream = new ReadableStream({
-        start(controller) {
-          // Stream the FAQ answer in chunks for consistent UX
-          const words = faqAnswer.split(' ')
-          let i = 0
-          const interval = setInterval(() => {
-            if (i < words.length) {
-              const chunk = (i === 0 ? '' : ' ') + words[i]
-              controller.enqueue(encoder.encode(chunk))
-              i++
-            } else {
-              clearInterval(interval)
-              controller.close()
-            }
-          }, 30)
-        },
-      })
-
-      return new NextResponse(stream, {
-        headers: {
-          'Content-Type': 'text/plain; charset=utf-8',
-          'Cache-Control': 'no-cache',
-          'Connection': 'keep-alive',
-        },
-      })
-    }
-
    const pitchContext = await loadPitchContext()

    let systemContent = SYSTEM_PROMPT
@@ -200,6 +170,11 @@ export async function POST(request: NextRequest) {
      systemContent += '\n' + pitchContext
    }

+    // FAQ context: relevant pre-researched answers as basis for the LLM
+    if (faqContext && typeof faqContext === 'string') {
+      systemContent += '\n' + faqContext
+    }
+
    // Slide context for contextual awareness
    if (slideContext) {
      const visited: number[] = slideContext.visitedSlides || []
@@ -7,7 +7,7 @@ import { ChatMessage, Language, SlideId } from '@/lib/types'
 import { t } from '@/lib/i18n'
 import { SLIDE_ORDER } from '@/lib/hooks/useSlideNavigation'
 import { PresenterState } from '@/lib/presenter/types'
-import { matchFAQ, getFAQAnswer } from '@/lib/presenter/faq-matcher'
+import { matchFAQMultiple, buildFAQContext } from '@/lib/presenter/faq-matcher'

 interface ChatFABProps {
  lang: Language
@@ -227,8 +227,9 @@ export default function ChatFAB({
    setIsStreaming(true)
    setIsWaiting(true)

-    // Check FAQ first for instant response
-    const faqMatch = matchFAQ(message, lang)
+    // Find relevant FAQ entries as context for the LLM
+    const faqMatches = matchFAQMultiple(message, lang, 3)
+    const faqContext = buildFAQContext(faqMatches, lang)

    abortRef.current = new AbortController()

@@ -245,9 +246,9 @@ export default function ChatFAB({
        },
      }

-      // If FAQ matched, send the cached answer for fast streaming (no LLM call)
-      if (faqMatch) {
-        requestBody.faqAnswer = getFAQAnswer(faqMatch, lang)
+      // Send FAQ context to LLM (not direct streaming — LLM interprets and combines)
+      if (faqContext) {
+        requestBody.faqContext = faqContext
      }

      const res = await fetch('/api/chat', {
@@ -7,11 +7,19 @@ import { PRESENTER_FAQ } from './presenter-faq'
 * Returns the best match if score exceeds threshold, or null for LLM fallback.
 */
 export function matchFAQ(query: string, lang: Language): FAQEntry | null {
+  const matches = matchFAQMultiple(query, lang, 1)
+  return matches.length > 0 ? matches[0] : null
+}
+
+/**
+ * Match a user query and return the top N relevant FAQ entries as context.
+ * Used to feed multiple relevant FAQs into the LLM prompt.
+ */
+export function matchFAQMultiple(query: string, lang: Language, maxResults: number = 3): FAQEntry[] {
  const normalized = query.toLowerCase().trim()
  const queryWords = normalized.split(/\s+/)

-  let bestMatch: FAQEntry | null = null
-  let bestScore = 0
+  const scored: { entry: FAQEntry; score: number }[] = []

  for (const entry of PRESENTER_FAQ) {
    let score = 0
@@ -20,23 +28,20 @@ export function matchFAQ(query: string, lang: Language): FAQEntry | null {
    for (const keyword of entry.keywords) {
      const kwLower = keyword.toLowerCase()
      if (kwLower.includes(' ')) {
-        // Multi-word keyword: check if phrase appears in query
        if (normalized.includes(kwLower)) {
          score += 3 * entry.priority / 10
        }
      } else {
-        // Single keyword: check word-level match
        if (queryWords.some(w => w === kwLower || w.startsWith(kwLower) || kwLower.startsWith(w))) {
          score += 1
        }
-        // Also check if keyword appears anywhere in query (partial match)
        if (normalized.includes(kwLower)) {
          score += 0.5
        }
      }
    }

-    // Check if query matches the question text closely
+    // Check question text overlap
    const questionText = lang === 'de' ? entry.question_de : entry.question_en
    const questionWords = questionText.toLowerCase().split(/\s+/)
    const overlapCount = queryWords.filter(w =>
@@ -46,22 +51,16 @@ export function matchFAQ(query: string, lang: Language): FAQEntry | null {
      score += overlapCount * 0.5
    }

-    // Weight by priority
    score *= (entry.priority / 10)

-    if (score > bestScore) {
-      bestScore = score
-      bestMatch = entry
+    if (score >= 1.0) {
+      scored.push({ entry, score })
    }
  }

-  // Threshold: need meaningful match to avoid false positives
-  // Require at least 2 keyword hits or strong phrase match
-  if (bestScore < 1.5) {
-    return null
-  }
-
-  return bestMatch
+  // Sort by score descending, return top N
+  scored.sort((a, b) => b.score - a.score)
+  return scored.slice(0, maxResults).map(s => s.entry)
 }

 /**
@@ -70,3 +69,18 @@ export function matchFAQ(query: string, lang: Language): FAQEntry | null {
 export function getFAQAnswer(entry: FAQEntry, lang: Language): string {
  return lang === 'de' ? entry.answer_de : entry.answer_en
 }
+
+/**
+ * Build a context string from multiple FAQ matches for LLM injection
+ */
+export function buildFAQContext(entries: FAQEntry[], lang: Language): string {
+  if (entries.length === 0) return ''
+
+  const parts = entries.map((entry, idx) => {
+    const q = lang === 'de' ? entry.question_de : entry.question_en
+    const a = lang === 'de' ? entry.answer_de : entry.answer_en
+    return `### Relevante Information ${idx + 1}: ${q}\n${a}`
+  })
+
+  return `\n\n## Vorrecherchierte Antworten (nutze diese als Basis, kombiniere bei Bedarf)\n${parts.join('\n\n')}\n\nWICHTIG: Formuliere die Antwort in deinen eigenen Worten als natürlichen Fließtext. Kombiniere die Informationen wenn die Frage mehrere Themen berührt. Antworte nicht mit Bulletlisten.`
+}