# breakpilot-compliance/backend-compliance/compliance/knowledge_production/schemas.py

"""Schemas for Knowledge Production — deterministic draft assembly + lifecycle.

The corpus is no longer written by hand: it is deterministically PREPARED from data the software
already owns (Capability, Transition Pattern, Controls, Evidence, leverage), then curated by an
expert. A `PlaybookDraft` is a machine-assembled skeleton with per-field provenance and an explicit
TODO list of what still needs human (or offline-propose) input. No LLM in the deterministic core.
Python 3.9 compatible (no `|` unions).
"""

from __future__ import annotations

from enum import Enum
from typing import Dict, List

from pydantic import BaseModel, Field


class DraftStatus(str, Enum):
    """Approval status ("Freigabestatus") of a knowledge item.

    Describes the knowledge lifecycle from a machine-generated draft up to
    field-proven content. It mirrors the transition-pattern / playbook
    maturity and adds one machine-assembled pre-stage in front of it.

    Each member is also a ``str``; its value is the lowercase status name.
    """

    # Assembled by the machine; NOT yet touched by an expert.
    DRAFT_GENERATED = "draft_generated"

    # An expert is currently curating the draft.
    IN_REVIEW = "in_review"

    # Internally reviewed.
    REVIEWED = "reviewed"

    # Confirmed by a domain expert.
    VALIDATED = "validated"

    # Confirmed in the field.
    PROVEN = "proven"


class PlaybookDraft(BaseModel):
    """Machine-assembled playbook skeleton for a single capability.

    The draft is put together deterministically. The "owned" fields
    (``why``, ``closes_regulations``, ``expected_evidence``,
    ``typical_controls``) are populated from data that already exists, and
    ``provenance`` records where each of them came from. Practitioner
    know-how (tools / process_steps / how_others) is not filled in here; it is
    listed in ``todo`` so that an expert reviews a prepared draft rather than
    starting from a blank page.

    Only ``capability_id`` is required. Every other field has a default:
    an empty string, a fresh empty container, or the initial status.
    """

    # Identity and lifecycle state of the draft.
    capability_id: str
    status: DraftStatus = DraftStatus.DRAFT_GENERATED
    title: str = ""

    # Taken from the transition pattern (why_asked / missing_because).
    why: str = ""

    # Taken from leverage (covers_targets).
    closes_regulations: List[str] = Field(default_factory=list)

    # Taken from the transition pattern.
    expected_evidence: List[str] = Field(default_factory=list)

    # Injected from Execution; may legitimately stay empty.
    typical_controls: List[str] = Field(default_factory=list)

    # Maps a field name to the source it was assembled from.
    provenance: Dict[str, str] = Field(default_factory=dict)

    # Fields that the expert / offline-propose step still has to supply.
    todo: List[str] = Field(default_factory=list)

    # Notice that this is a machine draft which requires expert curation.
    disclaimer: str = ""