This repository was archived on 2026-02-15. You can view its files and clone it, but you cannot open issues or pull requests or push commits.
Files
breakpilot-pwa/voice-service/models/session.py
Benjamin Admin bfdaf63ba9 fix: Restore all files lost during destructive rebase
A previous `git pull --rebase origin main` dropped 177 local commits,
losing 3400+ files across admin-v2, backend, studio-v2, website,
klausur-service, and many other services. The partial restore attempt
(660295e2) only recovered some files.

This commit restores all missing files from pre-rebase ref 98933f5e
while preserving post-rebase additions (night-scheduler, night-mode UI,
NightModeWidget dashboard integration).

Restored features include:
- AI Module Sidebar (FAB), OCR Labeling, OCR Compare
- GPU Dashboard, RAG Pipeline, Magic Help
- Klausur-Korrektur (8 files), Abitur-Archiv (5+ files)
- Companion, Zeugnisse-Crawler, Screen Flow
- Full backend, studio-v2, website, klausur-service
- All compliance SDKs, agent-core, voice-service
- CI/CD configs, documentation, scripts

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>
2026-02-09 09:51:32 +01:00

153 lines
5.1 KiB
Python

"""
Voice Session Models.

Transient session management - no persistent storage of audio data.

DSGVO (GDPR) Compliance:
- Sessions are RAM-only
- Audio chunks are processed and discarded
- Transcripts are encrypted before any storage
"""
from datetime import datetime
from enum import Enum
from typing import Optional, List, Dict, Any
from pydantic import BaseModel, Field
import uuid
class SessionStatus(str, Enum):
    """Status values a voice session can take.

    Each member is also a ``str``, so it compares equal to its lowercase
    string value. Iterating the enum yields members in declaration order.
    """

    CREATED = "created"
    CONNECTED = "connected"
    LISTENING = "listening"
    PROCESSING = "processing"
    RESPONDING = "responding"
    PAUSED = "paused"
    CLOSED = "closed"
    ERROR = "error"
class AudioChunk(BaseModel):
    """One chunk of streamed audio.

    By policy a chunk is NEVER persisted; it is meant to exist in RAM only
    while it is being processed.
    """

    sequence: int = Field(..., description="Chunk sequence number")
    timestamp_ms: int = Field(..., description="Timestamp in milliseconds")
    data: bytes = Field(..., description="PCM audio data (Int16, 24kHz)")
    duration_ms: int = Field(80, description="Chunk duration in ms")

    class Config:
        # JSON-encode raw bytes as a size-only placeholder so the audio
        # payload itself does not leak into serialized output or logs.
        # NOTE(review): `json_encoders` is a legacy config key on newer
        # pydantic releases - confirm the pinned version still honors it.
        json_encoders = {
            bytes: lambda raw: f"<audio:{len(raw)} bytes>",
        }
class TranscriptMessage(BaseModel):
    """A single transcript entry.

    ``content`` holds plaintext and is meant to live in RAM only; the
    message is encrypted before storage, and ``encrypted_ref`` can hold the
    resulting storage reference.

    ``role`` is a plain ``str``: the field description names ``'user'`` and
    ``'assistant'``, but nothing in this model enforces those values.
    """

    # Random UUID4 string unless the caller supplies an id.
    id: str = Field(default_factory=lambda: str(uuid.uuid4()))
    role: str = Field(..., description="'user' or 'assistant'")
    content: str = Field(
        ...,
        description="Transcript text (plaintext in RAM only)",
    )
    # Naive UTC timestamp taken when the message object is built.
    timestamp: datetime = Field(default_factory=datetime.utcnow)
    confidence: Optional[float] = Field(None, description="ASR confidence 0-1")
    intent: Optional[str] = Field(None, description="Detected intent")
    encrypted_ref: Optional[str] = Field(
        None,
        description="Encrypted storage reference",
    )

    class Config:
        # Example payload attached to the generated JSON schema.
        json_schema_extra = {
            "example": {
                "id": "msg-123",
                "role": "user",
                "content": "Notiz zu Max: heute wiederholt gestoert",
                "timestamp": "2026-01-26T10:30:00Z",
                "confidence": 0.95,
                "intent": "student_observation",
            }
        }
class VoiceSession(BaseModel):
    """State of one voice session.

    Intended to be stored in Valkey with a TTL and never written to
    persistent storage.
    """

    # Random UUID4 string unless the caller supplies an id.
    id: str = Field(default_factory=lambda: str(uuid.uuid4()))
    namespace_id: str = Field(..., description="Teacher namespace ID")
    key_hash: str = Field(..., description="Hash of client-side encryption key")
    status: SessionStatus = SessionStatus.CREATED
    # Both timestamps default to naive UTC "now"; each default is evaluated
    # by its own call, so they are not guaranteed to be identical.
    created_at: datetime = Field(default_factory=datetime.utcnow)
    last_activity: datetime = Field(default_factory=datetime.utcnow)

    # Conversation state (transient)
    messages: List[TranscriptMessage] = Field(default_factory=list)
    pending_tasks: List[str] = Field(default_factory=list, description="Task IDs")

    # Audio state (never persisted)
    audio_chunks_received: int = 0
    audio_chunks_processed: int = 0

    # Metadata (no PII)
    device_type: Optional[str] = Field(None, description="'pwa' or 'app'")
    client_version: Optional[str] = None

    def update_activity(self) -> None:
        """Set ``last_activity`` to the current naive UTC time."""
        self.last_activity = datetime.utcnow()

    class Config:
        # Example payload attached to the generated JSON schema.
        json_schema_extra = {
            "example": {
                "id": "session-abc123",
                "namespace_id": "teacher-ns-456",
                "key_hash": "sha256:abc...",
                "status": "listening",
                "created_at": "2026-01-26T10:00:00Z",
                "last_activity": "2026-01-26T10:30:00Z",
                "messages": [],
                "pending_tasks": [],
                "audio_chunks_received": 150,
                "audio_chunks_processed": 150,
                "device_type": "pwa",
            }
        }
class SessionCreate(BaseModel):
    """Request payload for creating a new voice session.

    ``namespace_id`` and ``key_hash`` are required; ``device_type`` defaults
    to ``"pwa"`` and ``client_version`` to ``None``.
    """

    namespace_id: str = Field(..., description="Teacher namespace ID")
    key_hash: str = Field(..., description="Hash of client-side encryption key")
    device_type: Optional[str] = "pwa"
    client_version: Optional[str] = None

    class Config:
        # Example payload attached to the generated JSON schema.
        json_schema_extra = {
            "example": {
                "namespace_id": "teacher-ns-456",
                "key_hash": "sha256:abc123def456...",
                "device_type": "pwa",
                "client_version": "1.0.0",
            }
        }
class SessionResponse(BaseModel):
    """Response payload returned after a session has been created.

    All fields are required; ``websocket_url`` is the WebSocket URL for
    audio streaming.
    """

    id: str
    namespace_id: str
    status: SessionStatus
    created_at: datetime
    websocket_url: str = Field(
        ...,
        description="WebSocket URL for audio streaming",
    )

    class Config:
        # Example payload attached to the generated JSON schema.
        json_schema_extra = {
            "example": {
                "id": "session-abc123",
                "namespace_id": "teacher-ns-456",
                "status": "created",
                "created_at": "2026-01-26T10:00:00Z",
                "websocket_url": "ws://localhost:8091/ws/voice?session_id=session-abc123",
            }
        }