feat(training): add Media Pipeline — TTS Audio, Presentation Video, Bulk Generation
All checks were successful
CI / go-lint (push) Has been skipped
CI / python-lint (push) Has been skipped
CI / nodejs-lint (push) Has been skipped
CI / test-go-ai-compliance (push) Successful in 36s
CI / test-python-backend-compliance (push) Successful in 31s
CI / test-python-document-crawler (push) Successful in 23s
CI / test-python-dsms-gateway (push) Successful in 21s
All checks were successful
CI / go-lint (push) Has been skipped
CI / python-lint (push) Has been skipped
CI / nodejs-lint (push) Has been skipped
CI / test-go-ai-compliance (push) Successful in 36s
CI / test-python-backend-compliance (push) Successful in 31s
CI / test-python-document-crawler (push) Successful in 23s
CI / test-python-dsms-gateway (push) Successful in 21s
Phase A: 8 new IT-Security training modules (SEC-PWD, SEC-DESK, SEC-KIAI, SEC-BYOD, SEC-VIDEO, SEC-USB, SEC-INC, SEC-HOME) with CTM entries. Bulk content and quiz generation endpoints for all 28 modules. Phase B: Piper TTS service (Python/FastAPI) for local German speech synthesis. training_media table, TTSClient in Go backend, audio generation endpoints, AudioPlayer component in frontend. MinIO storage integration. Phase C: FFmpeg presentation video pipeline — LLM generates slide scripts, ImageMagick renders 1920x1080 slides, FFmpeg combines with audio to MP4. VideoPlayer and ScriptPreview components in frontend. New files: 15 created, 9 modified - compliance-tts-service/ (Dockerfile, main.py, tts_engine.py, storage.py, slide_renderer.py, video_generator.py) - migrations 014-016 (training engine, IT-security modules, media table) - training package (models, store, content_generator, media, handlers) - frontend (AudioPlayer, VideoPlayer, ScriptPreview, api, types, page) Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>
This commit is contained in:
175
compliance-tts-service/main.py
Normal file
175
compliance-tts-service/main.py
Normal file
@@ -0,0 +1,175 @@
|
||||
"""Compliance TTS Service — Piper TTS + FFmpeg Audio/Video Pipeline."""
|
||||
import logging
|
||||
import os
|
||||
import tempfile
|
||||
import uuid
|
||||
|
||||
from fastapi import FastAPI, HTTPException
|
||||
from pydantic import BaseModel
|
||||
|
||||
from storage import StorageClient
|
||||
from tts_engine import PiperTTS
|
||||
|
||||
logging.basicConfig(level=logging.INFO)
|
||||
logger = logging.getLogger(__name__)
|
||||
|
||||
app = FastAPI(title="Compliance TTS Service", version="1.0.0")
|
||||
|
||||
# Configuration
|
||||
MINIO_ENDPOINT = os.getenv("MINIO_ENDPOINT", "bp-core-minio:9000")
|
||||
MINIO_ACCESS_KEY = os.getenv("MINIO_ACCESS_KEY", "breakpilot")
|
||||
MINIO_SECRET_KEY = os.getenv("MINIO_SECRET_KEY", "breakpilot123")
|
||||
PIPER_MODEL_PATH = os.getenv("PIPER_MODEL_PATH", "/app/models/de_DE-thorsten-high.onnx")
|
||||
|
||||
AUDIO_BUCKET = "compliance-training-audio"
|
||||
VIDEO_BUCKET = "compliance-training-video"
|
||||
|
||||
# Initialize services
|
||||
storage = StorageClient(MINIO_ENDPOINT, MINIO_ACCESS_KEY, MINIO_SECRET_KEY)
|
||||
tts = PiperTTS(PIPER_MODEL_PATH)
|
||||
|
||||
|
||||
@app.on_event("startup")
|
||||
async def startup():
|
||||
"""Ensure buckets exist on startup."""
|
||||
storage.ensure_bucket(AUDIO_BUCKET)
|
||||
storage.ensure_bucket(VIDEO_BUCKET)
|
||||
logger.info("TTS Service started")
|
||||
|
||||
|
||||
# --- Models ---
|
||||
|
||||
class SynthesizeRequest(BaseModel):
|
||||
text: str
|
||||
language: str = "de"
|
||||
voice: str = "thorsten-high"
|
||||
module_id: str
|
||||
content_id: str | None = None
|
||||
|
||||
|
||||
class SynthesizeResponse(BaseModel):
|
||||
audio_id: str
|
||||
bucket: str
|
||||
object_key: str
|
||||
duration_seconds: float
|
||||
size_bytes: int
|
||||
|
||||
|
||||
class GenerateVideoRequest(BaseModel):
|
||||
script: dict
|
||||
audio_object_key: str
|
||||
module_id: str
|
||||
|
||||
|
||||
class GenerateVideoResponse(BaseModel):
|
||||
video_id: str
|
||||
bucket: str
|
||||
object_key: str
|
||||
duration_seconds: float
|
||||
size_bytes: int
|
||||
|
||||
|
||||
class VoiceInfo(BaseModel):
|
||||
id: str
|
||||
language: str
|
||||
name: str
|
||||
quality: str
|
||||
|
||||
|
||||
# --- Endpoints ---
|
||||
|
||||
@app.get("/health")
|
||||
async def health():
|
||||
"""Health check endpoint."""
|
||||
return {
|
||||
"status": "healthy",
|
||||
"piper_available": tts.is_available,
|
||||
"ffmpeg_available": _check_ffmpeg(),
|
||||
"minio_connected": storage.is_connected(),
|
||||
}
|
||||
|
||||
|
||||
@app.get("/voices")
|
||||
async def list_voices():
|
||||
"""List available TTS voices."""
|
||||
return {
|
||||
"voices": [
|
||||
VoiceInfo(
|
||||
id="de_DE-thorsten-high",
|
||||
language="de",
|
||||
name="Thorsten (High Quality)",
|
||||
quality="high",
|
||||
),
|
||||
],
|
||||
}
|
||||
|
||||
|
||||
@app.post("/synthesize", response_model=SynthesizeResponse)
|
||||
async def synthesize(req: SynthesizeRequest):
|
||||
"""Synthesize text to audio and upload to storage."""
|
||||
if not req.text.strip():
|
||||
raise HTTPException(status_code=400, detail="Text is empty")
|
||||
|
||||
audio_id = str(uuid.uuid4())
|
||||
content_suffix = req.content_id or "full"
|
||||
object_key = f"audio/{req.module_id}/{content_suffix}.mp3"
|
||||
|
||||
with tempfile.TemporaryDirectory() as tmpdir:
|
||||
try:
|
||||
mp3_path, duration = tts.synthesize_to_mp3(req.text, tmpdir)
|
||||
size_bytes = storage.upload_file(AUDIO_BUCKET, object_key, mp3_path, "audio/mpeg")
|
||||
except Exception as e:
|
||||
logger.error(f"Synthesis failed: {e}")
|
||||
raise HTTPException(status_code=500, detail=str(e))
|
||||
|
||||
return SynthesizeResponse(
|
||||
audio_id=audio_id,
|
||||
bucket=AUDIO_BUCKET,
|
||||
object_key=object_key,
|
||||
duration_seconds=round(duration, 2),
|
||||
size_bytes=size_bytes,
|
||||
)
|
||||
|
||||
|
||||
@app.post("/generate-video", response_model=GenerateVideoResponse)
|
||||
async def generate_video(req: GenerateVideoRequest):
|
||||
"""Generate a presentation video from slides + audio."""
|
||||
try:
|
||||
from video_generator import generate_presentation_video
|
||||
except ImportError:
|
||||
raise HTTPException(status_code=501, detail="Video generation not available yet")
|
||||
|
||||
video_id = str(uuid.uuid4())
|
||||
object_key = f"video/{req.module_id}/presentation.mp4"
|
||||
|
||||
with tempfile.TemporaryDirectory() as tmpdir:
|
||||
try:
|
||||
mp4_path, duration = generate_presentation_video(
|
||||
script=req.script,
|
||||
audio_object_key=req.audio_object_key,
|
||||
output_dir=tmpdir,
|
||||
storage=storage,
|
||||
audio_bucket=AUDIO_BUCKET,
|
||||
)
|
||||
size_bytes = storage.upload_file(VIDEO_BUCKET, object_key, mp4_path, "video/mp4")
|
||||
except Exception as e:
|
||||
logger.error(f"Video generation failed: {e}")
|
||||
raise HTTPException(status_code=500, detail=str(e))
|
||||
|
||||
return GenerateVideoResponse(
|
||||
video_id=video_id,
|
||||
bucket=VIDEO_BUCKET,
|
||||
object_key=object_key,
|
||||
duration_seconds=round(duration, 2),
|
||||
size_bytes=size_bytes,
|
||||
)
|
||||
|
||||
|
||||
def _check_ffmpeg() -> bool:
|
||||
"""Check if ffmpeg is available."""
|
||||
import subprocess
|
||||
try:
|
||||
subprocess.run(["ffmpeg", "-version"], capture_output=True, timeout=5)
|
||||
return True
|
||||
except Exception:
|
||||
return False
|
||||
Reference in New Issue
Block a user