feat(training): add Media Pipeline — TTS Audio, Presentation Video, Bulk Generation

Phase A: 8 new IT-Security training modules (SEC-PWD, SEC-DESK, SEC-KIAI, SEC-BYOD, SEC-VIDEO, SEC-USB, SEC-INC, SEC-HOME) with CTM entries. Bulk content and quiz generation endpoints for all 28 modules. Phase B: Piper TTS service (Python/FastAPI) for local German speech synthesis. training_media table, TTSClient in Go backend, audio generation endpoints, AudioPlayer component in frontend. MinIO storage integration. Phase C: FFmpeg presentation video pipeline — LLM generates slide scripts, ImageMagick renders 1920x1080 slides, FFmpeg combines with audio to MP4. VideoPlayer and ScriptPreview components in frontend. New files: 15 created, 9 modified - compliance-tts-service/ (Dockerfile, main.py, tts_engine.py, storage.py, slide_renderer.py, video_generator.py) - migrations 014-016 (training engine, IT-security modules, media table) - training package (models, store, content_generator, media, handlers) - frontend (AudioPlayer, VideoPlayer, ScriptPreview, api, types, page) Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>
2026-02-16 21:42:33 +01:00
parent fba4c411dc
commit 375914e568
28 changed files with 7015 additions and 0 deletions
@@ -0,0 +1,175 @@
+"""Compliance TTS Service — Piper TTS + FFmpeg Audio/Video Pipeline."""
+import logging
+import os
+import tempfile
+import uuid
+
+from fastapi import FastAPI, HTTPException
+from pydantic import BaseModel
+
+from storage import StorageClient
+from tts_engine import PiperTTS
+
+logging.basicConfig(level=logging.INFO)
+logger = logging.getLogger(__name__)
+
+app = FastAPI(title="Compliance TTS Service", version="1.0.0")
+
+# Configuration
+MINIO_ENDPOINT = os.getenv("MINIO_ENDPOINT", "bp-core-minio:9000")
+MINIO_ACCESS_KEY = os.getenv("MINIO_ACCESS_KEY", "breakpilot")
+MINIO_SECRET_KEY = os.getenv("MINIO_SECRET_KEY", "breakpilot123")
+PIPER_MODEL_PATH = os.getenv("PIPER_MODEL_PATH", "/app/models/de_DE-thorsten-high.onnx")
+
+AUDIO_BUCKET = "compliance-training-audio"
+VIDEO_BUCKET = "compliance-training-video"
+
+# Initialize services
+storage = StorageClient(MINIO_ENDPOINT, MINIO_ACCESS_KEY, MINIO_SECRET_KEY)
+tts = PiperTTS(PIPER_MODEL_PATH)
+
+
+@app.on_event("startup")
+async def startup():
+    """Ensure buckets exist on startup."""
+    storage.ensure_bucket(AUDIO_BUCKET)
+    storage.ensure_bucket(VIDEO_BUCKET)
+    logger.info("TTS Service started")
+
+
+# --- Models ---
+
+class SynthesizeRequest(BaseModel):
+    text: str
+    language: str = "de"
+    voice: str = "thorsten-high"
+    module_id: str
+    content_id: str | None = None
+
+
+class SynthesizeResponse(BaseModel):
+    audio_id: str
+    bucket: str
+    object_key: str
+    duration_seconds: float
+    size_bytes: int
+
+
+class GenerateVideoRequest(BaseModel):
+    script: dict
+    audio_object_key: str
+    module_id: str
+
+
+class GenerateVideoResponse(BaseModel):
+    video_id: str
+    bucket: str
+    object_key: str
+    duration_seconds: float
+    size_bytes: int
+
+
+class VoiceInfo(BaseModel):
+    id: str
+    language: str
+    name: str
+    quality: str
+
+
+# --- Endpoints ---
+
+@app.get("/health")
+async def health():
+    """Health check endpoint."""
+    return {
+        "status": "healthy",
+        "piper_available": tts.is_available,
+        "ffmpeg_available": _check_ffmpeg(),
+        "minio_connected": storage.is_connected(),
+    }
+
+
+@app.get("/voices")
+async def list_voices():
+    """List available TTS voices."""
+    return {
+        "voices": [
+            VoiceInfo(
+                id="de_DE-thorsten-high",
+                language="de",
+                name="Thorsten (High Quality)",
+                quality="high",
+            ),
+        ],
+    }
+
+
+@app.post("/synthesize", response_model=SynthesizeResponse)
+async def synthesize(req: SynthesizeRequest):
+    """Synthesize text to audio and upload to storage."""
+    if not req.text.strip():
+        raise HTTPException(status_code=400, detail="Text is empty")
+
+    audio_id = str(uuid.uuid4())
+    content_suffix = req.content_id or "full"
+    object_key = f"audio/{req.module_id}/{content_suffix}.mp3"
+
+    with tempfile.TemporaryDirectory() as tmpdir:
+        try:
+            mp3_path, duration = tts.synthesize_to_mp3(req.text, tmpdir)
+            size_bytes = storage.upload_file(AUDIO_BUCKET, object_key, mp3_path, "audio/mpeg")
+        except Exception as e:
+            logger.error(f"Synthesis failed: {e}")
+            raise HTTPException(status_code=500, detail=str(e))
+
+    return SynthesizeResponse(
+        audio_id=audio_id,
+        bucket=AUDIO_BUCKET,
+        object_key=object_key,
+        duration_seconds=round(duration, 2),
+        size_bytes=size_bytes,
+    )
+
+
+@app.post("/generate-video", response_model=GenerateVideoResponse)
+async def generate_video(req: GenerateVideoRequest):
+    """Generate a presentation video from slides + audio."""
+    try:
+        from video_generator import generate_presentation_video
+    except ImportError:
+        raise HTTPException(status_code=501, detail="Video generation not available yet")
+
+    video_id = str(uuid.uuid4())
+    object_key = f"video/{req.module_id}/presentation.mp4"
+
+    with tempfile.TemporaryDirectory() as tmpdir:
+        try:
+            mp4_path, duration = generate_presentation_video(
+                script=req.script,
+                audio_object_key=req.audio_object_key,
+                output_dir=tmpdir,
+                storage=storage,
+                audio_bucket=AUDIO_BUCKET,
+            )
+            size_bytes = storage.upload_file(VIDEO_BUCKET, object_key, mp4_path, "video/mp4")
+        except Exception as e:
+            logger.error(f"Video generation failed: {e}")
+            raise HTTPException(status_code=500, detail=str(e))
+
+    return GenerateVideoResponse(
+        video_id=video_id,
+        bucket=VIDEO_BUCKET,
+        object_key=object_key,
+        duration_seconds=round(duration, 2),
+        size_bytes=size_bytes,
+    )
+
+
+def _check_ffmpeg() -> bool:
+    """Check if ffmpeg is available."""
+    import subprocess
+    try:
+        subprocess.run(["ffmpeg", "-version"], capture_output=True, timeout=5)
+        return True
+    except Exception:
+        return False