457 lines
15 KiB
Go
457 lines
15 KiB
Go
package handlers
|
|
|
|
import (
|
|
"encoding/json"
|
|
"fmt"
|
|
"log"
|
|
"net/http"
|
|
"strconv"
|
|
|
|
"github.com/breakpilot/ai-compliance-sdk/internal/ucca"
|
|
"github.com/gin-gonic/gin"
|
|
)
|
|
|
|
// RAGHandlers handles RAG search API endpoints.
|
|
type RAGHandlers struct {
|
|
ragClient *ucca.LegalRAGClient
|
|
corpusVersionStore *ucca.CorpusVersionStore
|
|
}
|
|
|
|
// NewRAGHandlers creates new RAG handlers.
|
|
func NewRAGHandlers(corpusVersionStore *ucca.CorpusVersionStore) *RAGHandlers {
|
|
return &RAGHandlers{
|
|
ragClient: ucca.NewLegalRAGClient(),
|
|
corpusVersionStore: corpusVersionStore,
|
|
}
|
|
}
|
|
|
|
// AllowedCollections is the whitelist of Qdrant collections that can be queried.
|
|
var AllowedCollections = map[string]bool{
|
|
"bp_compliance_ce": true,
|
|
"bp_compliance_gesetze": true,
|
|
"bp_compliance_datenschutz": true,
|
|
"bp_compliance_recht": true,
|
|
"bp_compliance_gdpr": true,
|
|
"bp_dsfa_corpus": true,
|
|
"bp_dsfa_templates": true,
|
|
"bp_dsfa_risks": true,
|
|
"bp_legal_templates": true,
|
|
"bp_iace_libraries": true,
|
|
"bp_iace_accident_stats": true,
|
|
"bp_iace_safety_kb": true,
|
|
"bp_iace_fmea_kb": true,
|
|
}
|
|
|
|
// SearchRequest represents a RAG search request.
|
|
type SearchRequest struct {
|
|
Query string `json:"query" binding:"required"`
|
|
Collection string `json:"collection,omitempty"`
|
|
Regulations []string `json:"regulations,omitempty"`
|
|
TopK int `json:"top_k,omitempty"`
|
|
}
|
|
|
|
// Search performs a semantic search across the compliance regulation corpus.
|
|
// POST /sdk/v1/rag/search
|
|
func (h *RAGHandlers) Search(c *gin.Context) {
|
|
var req SearchRequest
|
|
if err := c.ShouldBindJSON(&req); err != nil {
|
|
c.JSON(http.StatusBadRequest, gin.H{"error": err.Error()})
|
|
return
|
|
}
|
|
|
|
if req.TopK <= 0 || req.TopK > 20 {
|
|
req.TopK = 5
|
|
}
|
|
|
|
// Validate collection if specified
|
|
if req.Collection != "" {
|
|
if !AllowedCollections[req.Collection] {
|
|
c.JSON(http.StatusBadRequest, gin.H{"error": "Unknown collection: " + req.Collection + ". Allowed: bp_compliance_ce, bp_compliance_recht, bp_compliance_gesetze, bp_compliance_datenschutz, bp_dsfa_corpus, bp_legal_templates"})
|
|
return
|
|
}
|
|
}
|
|
|
|
results, err := h.ragClient.SearchCollection(c.Request.Context(), req.Collection, req.Query, req.Regulations, req.TopK)
|
|
if err != nil {
|
|
c.JSON(http.StatusInternalServerError, gin.H{"error": "RAG search failed: " + err.Error()})
|
|
return
|
|
}
|
|
|
|
c.JSON(http.StatusOK, gin.H{
|
|
"query": req.Query,
|
|
"results": results,
|
|
"count": len(results),
|
|
"assessment": ucca.Assess(results),
|
|
})
|
|
}
|
|
|
|
// RetrieveRequest is the Authority Router request: a query only, no collection — the router decides
|
|
// which collections to query (broad authority base + the in-scope KB-2026.1 slice).
|
|
type RetrieveRequest struct {
|
|
Query string `json:"query" binding:"required"`
|
|
TopK int `json:"top_k,omitempty"`
|
|
Context string `json:"context,omitempty"`
|
|
}
|
|
|
|
// Retrieve is the Authority Router endpoint. The Advisor calls this with ONLY a query and stays
|
|
// collection-agnostic; the router fans out over the authority base + the in-scope slice, merges by
|
|
// authority score, and returns the unified top-K. Response shape matches Search (query/results/
|
|
// count/assessment) so existing consumers parse it unchanged.
|
|
// POST /sdk/v1/rag/retrieve
|
|
func (h *RAGHandlers) Retrieve(c *gin.Context) {
|
|
var req RetrieveRequest
|
|
if err := c.ShouldBindJSON(&req); err != nil {
|
|
c.JSON(http.StatusBadRequest, gin.H{"error": err.Error()})
|
|
return
|
|
}
|
|
|
|
if req.TopK <= 0 || req.TopK > 20 {
|
|
req.TopK = 8
|
|
}
|
|
|
|
// E2 Term Resolution: expand unambiguous abbreviations (TOM/VVT/AVV/DSB/DSFA) into the
|
|
// query so retrieval finds them; ambiguous ones (DSE/DPA) are surfaced to the FE — NOT
|
|
// auto-mapped (chat context E1 wins, else the FE asks).
|
|
intent := ucca.DetectIntent(req.Query)
|
|
termRes := ucca.ResolveAbbreviations(req.Query)
|
|
req.Query = termRes.Expanded
|
|
|
|
results, err := h.ragClient.Retrieve(c.Request.Context(), req.Query, req.TopK)
|
|
if err != nil {
|
|
c.JSON(http.StatusInternalServerError, gin.H{"error": "RAG retrieve failed: " + err.Error()})
|
|
return
|
|
}
|
|
|
|
// Evidence-Type-Schicht: die autoritative typisierte Evidence (Fußnoten/Tabellen/Figuren) aus
|
|
// dem KB-Wissensraum SEPARAT surfacen, statt sie im Breit-Basis-Text-Merge zu verlieren.
|
|
// results[] bleibt der Text-Kontext fürs LLM + die Quellen-Liste.
|
|
// Context scoping (E5): the user explicitly chose a knowledge space (chip), so scope
|
|
// the evidence HARD to it (wider re-retrieve + domain filter) — no off-domain regelwerke
|
|
// (MDR/UStG/eIDAS) after a context decision.
|
|
if req.Context != "" {
|
|
if wide, werr := h.ragClient.Retrieve(c.Request.Context(), req.Query, 30); werr == nil && len(wide) > 0 {
|
|
results = ucca.FilterByKnowledgeSpace(wide, req.Context, req.TopK)
|
|
} else {
|
|
results = ucca.FilterByKnowledgeSpace(results, req.Context, req.TopK)
|
|
}
|
|
}
|
|
|
|
// G1 scope-gating: a named regulation scopes the evidence to its knowledge space.
|
|
// Re-retrieve wider and lead with the named regulation's domain so the L2 answer +
|
|
// [n] citations are built on scoped evidence, not the embedding-majority domain.
|
|
if scope := ucca.QueryKnowledgeSpace(req.Query); scope != "" {
|
|
if wide, werr := h.ragClient.Retrieve(c.Request.Context(), req.Query, 30); werr == nil && len(wide) > 0 {
|
|
results = ucca.ScopeResults(wide, scope, req.TopK)
|
|
} else {
|
|
results = ucca.ScopeResults(results, scope, req.TopK)
|
|
}
|
|
}
|
|
|
|
ev := h.ragClient.RetrieveEvidence(c.Request.Context(), req.Query)
|
|
// Concept->Norm recall injector: if the query names a legal concept, fetch its
|
|
// load-bearing norms (Datenschutzerklärung -> Art. 12/13/14 DSGVO, ...) and inject
|
|
// them into the evidence set so they surface (embedding similarity misses them).
|
|
if norms := ucca.ConceptNorms(req.Query); len(norms) > 0 {
|
|
top := 0.9
|
|
if len(results) > 0 {
|
|
top = results[0].Score
|
|
}
|
|
injected := h.ragClient.FetchByNormIDs(c.Request.Context(), norms, top-0.001)
|
|
results = ucca.InjectConceptNorms(results, injected, req.TopK)
|
|
}
|
|
clarity := ucca.ClassifyClarity(req.Query, results)
|
|
traceClarity(req.Query, clarity, results)
|
|
|
|
c.JSON(http.StatusOK, gin.H{
|
|
"query": req.Query,
|
|
"results": results,
|
|
"count": len(results),
|
|
"assessment": ucca.Assess(results),
|
|
"footnotes": footnotesFromEvidence(ev[ucca.EvidenceFootnote]),
|
|
"tables": tablesFromEvidence(ev[ucca.EvidenceTable]),
|
|
"evidence": evidenceFromResults(results),
|
|
"visual_evidence": visualEvidenceFromEvidence(ev[ucca.EvidenceFigure]),
|
|
"clarity": clarity,
|
|
"term_resolution": termRes.Ambiguous,
|
|
"interaction_intent": intent,
|
|
})
|
|
}
|
|
|
|
// footnotesFromEvidence maps FOOTNOTE evidence to the Evidence-Workspace RawFootnote shape.
|
|
func footnotesFromEvidence(rs []ucca.LegalSearchResult) []gin.H {
|
|
out := make([]gin.H, 0, len(rs))
|
|
for _, r := range rs {
|
|
out = append(out, gin.H{
|
|
"id": r.CitationUnit,
|
|
"ref": r.CitationUnit,
|
|
"number": r.FootnoteLabel,
|
|
"regulation_code": r.RegulationCode,
|
|
"regulation_short": r.RegulationShort,
|
|
"regulation_name": r.RegulationName,
|
|
"section": r.RefCitationUnit,
|
|
"text": r.FootnoteVerbatim,
|
|
})
|
|
}
|
|
return out
|
|
}
|
|
|
|
// tablesFromEvidence maps TABLE evidence (C6/C9). Key is present so the same Evidence-Type path
|
|
// carries tables the moment the UI adds a table section.
|
|
func tablesFromEvidence(rs []ucca.LegalSearchResult) []gin.H {
|
|
out := make([]gin.H, 0, len(rs))
|
|
for _, r := range rs {
|
|
out = append(out, gin.H{
|
|
"id": r.CitationUnit,
|
|
"caption": r.ArticleLabel,
|
|
"regulation_code": r.RegulationCode,
|
|
"regulation_short": r.RegulationShort,
|
|
"regulation_name": r.RegulationName,
|
|
"section": r.RefCitationUnit,
|
|
"text": r.Text,
|
|
})
|
|
}
|
|
return out
|
|
}
|
|
|
|
// visualEvidenceFromEvidence maps FIGURE evidence to the Visual Evidence contract shape
|
|
// (C8). visual_type/image_ref/vision_summary populate once C8 lands; the shape is stable now.
|
|
func visualEvidenceFromEvidence(rs []ucca.LegalSearchResult) []gin.H {
|
|
out := make([]gin.H, 0, len(rs))
|
|
for _, r := range rs {
|
|
out = append(out, gin.H{
|
|
"visual_id": r.CitationUnit,
|
|
"visual_type": "figure",
|
|
"caption": r.ArticleLabel,
|
|
"document": evidenceDocName(r),
|
|
"context": ucca.KnowledgeSpaceOf(r.RegulationCode),
|
|
"regulation_code": r.RegulationCode,
|
|
"section": r.RefCitationUnit,
|
|
"image_ref": "",
|
|
"vision_summary": "",
|
|
})
|
|
}
|
|
return out
|
|
}
|
|
|
|
// evidenceFromResults maps retrieval hits to the Evidence contract shape the Advisor
|
|
// Evidence Workspace renders (citations[] reference evidence_id). Populated at retrieve
|
|
// time; citations[] (the [n]<->evidence coupling) come from the answer-generation step.
|
|
func evidenceFromResults(rs []ucca.LegalSearchResult) []gin.H {
|
|
out := make([]gin.H, 0, len(rs))
|
|
for _, r := range rs {
|
|
id := r.CitationUnit
|
|
if id == "" {
|
|
id = r.ArticleLabel
|
|
}
|
|
out = append(out, gin.H{
|
|
"evidence_id": id,
|
|
"document": evidenceDocName(r),
|
|
"section": r.ArticleLabel,
|
|
"paragraph": r.Paragraph,
|
|
"snippet": evidenceSnippet(r.Text, 280),
|
|
"url": r.SourceURL,
|
|
"regulation_code": r.RegulationCode,
|
|
"context": ucca.KnowledgeSpaceOf(r.RegulationCode),
|
|
})
|
|
}
|
|
return out
|
|
}
|
|
|
|
// evidenceDocName is the human-facing source name (short code, else full name).
|
|
func evidenceDocName(r ucca.LegalSearchResult) string {
|
|
if r.RegulationShort != "" {
|
|
return r.RegulationShort
|
|
}
|
|
return r.RegulationName
|
|
}
|
|
|
|
// evidenceSnippet returns a trimmed excerpt of at most n runes.
|
|
func evidenceSnippet(s string, n int) string {
|
|
rs := []rune(s)
|
|
if len(rs) <= n {
|
|
return s
|
|
}
|
|
return string(rs[:n]) + "…"
|
|
}
|
|
|
|
// ListRegulations returns the list of available regulations in the corpus.
|
|
// GET /sdk/v1/rag/regulations
|
|
func (h *RAGHandlers) ListRegulations(c *gin.Context) {
|
|
regs := h.ragClient.ListAvailableRegulations()
|
|
|
|
// Optionally filter by category
|
|
category := c.Query("category")
|
|
if category != "" {
|
|
filtered := make([]ucca.CERegulationInfo, 0)
|
|
for _, r := range regs {
|
|
if r.Category == category {
|
|
filtered = append(filtered, r)
|
|
}
|
|
}
|
|
regs = filtered
|
|
}
|
|
|
|
c.JSON(http.StatusOK, gin.H{
|
|
"regulations": regs,
|
|
"count": len(regs),
|
|
})
|
|
}
|
|
|
|
// CorpusStatus returns the current version status of all RAG collections.
|
|
// GET /sdk/v1/rag/corpus-status
|
|
func (h *RAGHandlers) CorpusStatus(c *gin.Context) {
|
|
if h.corpusVersionStore == nil {
|
|
c.JSON(http.StatusServiceUnavailable, gin.H{"error": "corpus version store not configured"})
|
|
return
|
|
}
|
|
|
|
versions, err := h.corpusVersionStore.GetAllLatestVersions(c.Request.Context())
|
|
if err != nil {
|
|
c.JSON(http.StatusInternalServerError, gin.H{"error": "failed to fetch corpus versions: " + err.Error()})
|
|
return
|
|
}
|
|
|
|
collections := make(map[string]gin.H)
|
|
for _, v := range versions {
|
|
collections[v.CollectionName] = gin.H{
|
|
"id": v.ID,
|
|
"current_version": v.Version,
|
|
"documents_count": v.DocumentsCount,
|
|
"chunks_count": v.ChunksCount,
|
|
"regulations": v.Regulations,
|
|
"last_updated": v.CreatedAt,
|
|
"digest": v.Digest,
|
|
}
|
|
}
|
|
|
|
c.JSON(http.StatusOK, gin.H{
|
|
"collections": collections,
|
|
})
|
|
}
|
|
|
|
// CorpusVersionHistory returns the version history for a specific collection.
|
|
// GET /sdk/v1/rag/corpus-versions/:collection
|
|
func (h *RAGHandlers) CorpusVersionHistory(c *gin.Context) {
|
|
if h.corpusVersionStore == nil {
|
|
c.JSON(http.StatusServiceUnavailable, gin.H{"error": "corpus version store not configured"})
|
|
return
|
|
}
|
|
|
|
collection := c.Param("collection")
|
|
if collection == "" {
|
|
c.JSON(http.StatusBadRequest, gin.H{"error": "collection name required"})
|
|
return
|
|
}
|
|
|
|
versions, err := h.corpusVersionStore.ListCorpusVersions(c.Request.Context(), collection)
|
|
if err != nil {
|
|
c.JSON(http.StatusInternalServerError, gin.H{"error": "failed to fetch corpus versions: " + err.Error()})
|
|
return
|
|
}
|
|
|
|
c.JSON(http.StatusOK, gin.H{
|
|
"collection": collection,
|
|
"versions": versions,
|
|
"count": len(versions),
|
|
})
|
|
}
|
|
|
|
// HandleScrollChunks scrolls/lists all chunks in a Qdrant collection with pagination.
|
|
// GET /sdk/v1/rag/scroll?collection=...&offset=...&limit=...
|
|
func (h *RAGHandlers) HandleScrollChunks(c *gin.Context) {
|
|
collection := c.Query("collection")
|
|
if collection == "" {
|
|
c.JSON(http.StatusBadRequest, gin.H{"error": "query parameter 'collection' is required"})
|
|
return
|
|
}
|
|
|
|
if !AllowedCollections[collection] {
|
|
c.JSON(http.StatusBadRequest, gin.H{"error": "Unknown collection: " + collection})
|
|
return
|
|
}
|
|
|
|
// Parse limit (default 100, max 500)
|
|
limit := 100
|
|
if limitStr := c.Query("limit"); limitStr != "" {
|
|
parsed, err := strconv.Atoi(limitStr)
|
|
if err != nil || parsed < 1 {
|
|
c.JSON(http.StatusBadRequest, gin.H{"error": "limit must be a positive integer"})
|
|
return
|
|
}
|
|
limit = parsed
|
|
}
|
|
if limit > 500 {
|
|
limit = 500
|
|
}
|
|
|
|
// Offset is optional (empty string = start from beginning)
|
|
offset := c.Query("offset")
|
|
|
|
chunks, nextOffset, err := h.ragClient.ScrollChunks(c.Request.Context(), collection, offset, limit)
|
|
if err != nil {
|
|
c.JSON(http.StatusInternalServerError, gin.H{"error": "scroll failed: " + err.Error()})
|
|
return
|
|
}
|
|
|
|
c.JSON(http.StatusOK, gin.H{
|
|
"chunks": chunks,
|
|
"next_offset": nextOffset,
|
|
"total": len(chunks),
|
|
})
|
|
}
|
|
|
|
// LegalCorpusStructure returns the composition (distinct articles, annexes,
|
|
// recitals + chunk count) of every ingested eur-lex legal act, so the coverage
|
|
// page can show WHAT was ingested instead of just the act name.
|
|
// GET /sdk/v1/rag/legal-corpus
|
|
func (h *RAGHandlers) LegalCorpusStructure(c *gin.Context) {
|
|
acts, err := h.ragClient.CorpusStructure(c.Request.Context())
|
|
if err != nil {
|
|
c.JSON(http.StatusInternalServerError, gin.H{"error": "failed to aggregate legal corpus: " + err.Error()})
|
|
return
|
|
}
|
|
|
|
arts, anns, recs := 0, 0, 0
|
|
for _, a := range acts {
|
|
arts += a.Articles
|
|
anns += a.Annexes
|
|
recs += a.Recitals
|
|
}
|
|
|
|
c.JSON(http.StatusOK, gin.H{
|
|
"regulations": acts,
|
|
"totals": gin.H{
|
|
"regulations": len(acts),
|
|
"articles": arts,
|
|
"annexes": anns,
|
|
"recitals": recs,
|
|
},
|
|
})
|
|
}
|
|
|
|
// traceClarity emits a structured CLARITY_TRACE log line per retrieve for the macmini
|
|
// test session, so qualitative user ratings can be correlated with the gate decision.
|
|
func traceClarity(query string, cl ucca.Clarity, results []ucca.LegalSearchResult) {
|
|
top := make([]string, 0, 3)
|
|
for i, r := range results {
|
|
if i >= 3 {
|
|
break
|
|
}
|
|
top = append(top, r.RegulationShort)
|
|
}
|
|
chips := make([]string, 0, len(cl.CandidateContexts))
|
|
for _, c := range cl.CandidateContexts {
|
|
chips = append(chips, fmt.Sprintf("%s:%d", c.ID, c.Hits))
|
|
}
|
|
b, _ := json.Marshal(map[string]interface{}{
|
|
"query": query,
|
|
"mode": cl.Mode,
|
|
"reason": cl.Reason,
|
|
"concentration": cl.Concentration,
|
|
"dominant": cl.DominantContext,
|
|
"chips": chips,
|
|
"top_evidence": top,
|
|
})
|
|
log.Printf("CLARITY_TRACE %s", string(b))
|
|
}
|