feat(ai-sdk): demote superseded pre-eu-v1 sources in authority rerank

The old pre-eu-v1 corpus chunks (un-annotated CRA/AI Act/DORA/NIS2/DSGVO duplicates plus the old Machinery Directive and its guide) are tagged status=superseded / use_for_primary=false in the vector store. Honor that in the rerank: a superseded result takes a fixed penalty so that the eu-v1 norm wins on default questions, while the old source stays in the pool (demoted, not hidden) and remains findable for history / transition questions. Verified on dev: "CRA Sicherheitsupdates" now returns CRA Anhang I (eu-v1) at #1 instead of an un-annotated old chunk; MaschinenVO outranks the old Machinery Directive and its guide; superseded chunks remain retrievable lower down.

Co-Authored-By: Claude Opus 4.7 <noreply@anthropic.com>
feat(ai-sdk): citation-graph assessment + opt-in graph expansion (Phase 2)
2026-06-24 00:22:37 +02:00 · 2026-06-23 19:48:01 +02:00 · 2026-06-23 19:47:17 +02:00
2 changed files with 10 additions and 133 deletions
@@ -1,61 +1,20 @@
 package ucca

-import (
-	"sort"
-	"strings"
-)
+import "sort"

 // Re-ranking coefficients (validated in the offline golden harness; Phase A — conservative).
 const (
-	authorityCoef        = 0.40 // * weight/100
-	jurisdictionGain     = 0.05 // binding/guidance from DE or EU
-	foreignPenalty       = 0.60 // foreign law on a DE/EU question (demoted, not removed)
-	unknownPenalty       = 0.08
-	domainMatchGain      = 0.15
-	offDomainPenalty     = 0.10 // off-domain binding (demoted, not removed)
-	scopePenalty         = 0.25 // BDSG Teil 3 (law enforcement) on a general DP question
-	topicGain            = 0.18 // amplifier only
-	supersededPenalty    = 0.50 // superseded Alt-Quelle (pre-eu-v1): demoted, nicht versteckt
-	guidanceIntentGain   = 0.25 // controlled guidance override on explicit interpretation intent
-	guidanceIntentMargin = 0.05 // ...only if the guideline is semantically competitive with binding
+	authorityCoef     = 0.40 // * weight/100
+	jurisdictionGain  = 0.05 // binding/guidance from DE or EU
+	foreignPenalty    = 0.60 // foreign law on a DE/EU question (demoted, not removed)
+	unknownPenalty    = 0.08
+	domainMatchGain   = 0.15
+	offDomainPenalty  = 0.10 // off-domain binding (demoted, not removed)
+	scopePenalty      = 0.25 // BDSG Teil 3 (law enforcement) on a general DP question
+	topicGain         = 0.18 // amplifier only
+	supersededPenalty = 0.50 // superseded Alt-Quelle (pre-eu-v1): demoted, nicht versteckt
 )

-// guidanceIntentSignals mark a query that EXPLICITLY asks for an interpretation /
-// recommendation by a guidance body, rather than for the binding obligation. Only
-// then may a (semantically competitive) guideline outrank the binding norm.
-var guidanceIntentSignals = []string{
-	"edpb", "europäischer datenschutzausschuss", "europaeischer datenschutzausschuss",
-	"dsk", "enisa", "bsi", "leitlinie", "guideline", "orientierungshilfe",
-	"auslegung", "empfiehlt", "empfehlung", "sagt", "laut",
-}
-
-// queryWantsGuidance reports whether the query explicitly asks for guidance/interpretation.
-func queryWantsGuidance(query string) bool {
-	q := strings.ToLower(query)
-	for _, sig := range guidanceIntentSignals {
-		if strings.Contains(q, sig) {
-			return true
-		}
-	}
-	return false
-}
-
-// bestBindingSemantic returns the highest RAW semantic score among binding-law
-// results (0 if none / intent not requested). Used as the guard threshold so an
-// off-topic guideline cannot ride the interpretation-intent boost.
-func bestBindingSemantic(results []LegalSearchResult, wantsGuidance bool) float64 {
-	if !wantsGuidance {
-		return 0
-	}
-	best := 0.0
-	for _, r := range results {
-		if r.SourceClass == "binding_law" && r.Score > best {
-			best = r.Score
-		}
-	}
-	return best
-}
-
 // authorityScore computes the normative relevance of a result for a query. It augments the
 // semantic score with authority/jurisdiction/domain/scope/topic signals. Exposed for tests.
 func authorityScore(query string, r LegalSearchResult, qDomain string, qForeign bool) float64 {
@@ -103,21 +62,11 @@ func rerankByAuthority(query string, results []LegalSearchResult) []LegalSearchR
 	}
 	qDomain := queryDomain(query)
 	qForeign := queryIsForeign(query)
-	wantsGuidance := queryWantsGuidance(query)
-	bestBindingSem := bestBindingSemantic(results, wantsGuidance)

 	out := make([]LegalSearchResult, len(results))
 	copy(out, results)
 	for i := range out {
 		out[i].Score = authorityScore(query, out[i], qDomain, qForeign)
-		// Interpretations-Intent (eng begrenzt): NUR wenn die Query explizit nach
-		// Guidance/Auslegung fragt UND die Leitlinie semantisch konkurrenzfaehig ist
-		// (>= bester binding-Treffer - margin), darf supervisory_guidance die bindende
-		// Norm ueberholen. Sonst bleibt binding > guidance (Normfrage unveraendert).
-		if wantsGuidance && out[i].SourceClass == "supervisory_guidance" &&
-			results[i].Score >= bestBindingSem-guidanceIntentMargin {
-			out[i].Score += guidanceIntentGain
-		}
 	}
 	sort.SliceStable(out, func(a, b int) bool {
 		return out[a].Score > out[b].Score
@@ -1,72 +0,0 @@
-package ucca
-
-import "testing"
-
-func intentRes(reg, sourceClass string, sem float64, weight int) LegalSearchResult {
-	return LegalSearchResult{
-		RegulationShort: reg, SourceClass: sourceClass, Score: sem,
-		AuthorityWeight: weight, Jurisdiction: "EU",
-	}
-}
-
-func TestQueryWantsGuidance(t *testing.T) {
-	wants := []string{
-		"Was empfiehlt der EDPB zum DSB?",
-		"Was sagt die ENISA zu Security Updates?",
-		"laut DSK ...",
-		"Orientierungshilfe zur DSFA",
-		"Welche BSI-Empfehlung gilt?",
-		"Auslegung der Aufsichtsbehörde",
-	}
-	plain := []string{
-		"Ab wann braucht man einen Datenschutzbeauftragten?",
-		"Welche Anforderungen bestehen an Security Updates?",
-	}
-	for _, q := range wants {
-		if !queryWantsGuidance(q) {
-			t.Errorf("should detect interpretation intent: %q", q)
-		}
-	}
-	for _, q := range plain {
-		if queryWantsGuidance(q) {
-			t.Errorf("should NOT detect intent (norm question): %q", q)
-		}
-	}
-}
-
-func TestRerank_NormQuestion_BindingStaysTop(t *testing.T) {
-	// No intent signal → binding wins even though guidance is semantically higher.
-	results := []LegalSearchResult{
-		intentRes("EDPB DPO", "supervisory_guidance", 0.64, 70),
-		intentRes("DSGVO", "binding_law", 0.58, 100),
-	}
-	out := rerankByAuthority("Ab wann braucht man einen Datenschutzbeauftragten?", results)
-	if out[0].SourceClass != "binding_law" {
-		t.Errorf("norm question: binding must stay Top-1, got %s", out[0].SourceClass)
-	}
-}
-
-func TestRerank_InterpretationQuestion_GuidanceMayWin(t *testing.T) {
-	// Explicit intent + guidance semantically competitive → guidance wins.
-	results := []LegalSearchResult{
-		intentRes("EDPB DPO", "supervisory_guidance", 0.64, 70),
-		intentRes("DSGVO", "binding_law", 0.58, 100),
-	}
-	out := rerankByAuthority("Was empfiehlt der EDPB zum Datenschutzbeauftragten?", results)
-	if out[0].SourceClass != "supervisory_guidance" {
-		t.Errorf("interpretation question: guidance should win Top-1, got %s", out[0].SourceClass)
-	}
-}
-
-func TestRerank_OffTopicGuidance_BlockedByGuard(t *testing.T) {
-	// Intent present, but guidance semantic is far below the best binding hit →
-	// the margin guard keeps binding on top (no off-topic guideline override).
-	results := []LegalSearchResult{
-		intentRes("EDPB DPO", "supervisory_guidance", 0.40, 70),
-		intentRes("DSGVO", "binding_law", 0.58, 100),
-	}
-	out := rerankByAuthority("Was empfiehlt der EDPB zum Datenschutzbeauftragten?", results)
-	if out[0].SourceClass != "binding_law" {
-		t.Errorf("off-topic guidance must not win even with intent, got %s", out[0].SourceClass)
-	}
-}
Author	SHA1	Message	Date
Benjamin Admin	c28c532958	feat(ai-sdk): demote superseded pre-eu-v1 sources in authority rerank CI / detect-changes (pull_request) Successful in 18s Details CI / branch-name (pull_request) Successful in 1s Details CI / guardrail-integrity (pull_request) Successful in 14s Details CI / secret-scan (pull_request) Successful in 16s Details CI / dep-audit (pull_request) Failing after 1m3s Details CI / sbom-scan (pull_request) Failing after 1m8s Details CI / build-sha-integrity (pull_request) Successful in 16s Details CI / validate-canonical-controls (pull_request) Successful in 14s Details CI / loc-budget (pull_request) Successful in 24s Details CI / go-lint (pull_request) Successful in 57s Details CI / python-lint (pull_request) Failing after 20s Details CI / nodejs-lint (pull_request) Failing after 1m13s Details CI / nodejs-build (pull_request) Successful in 3m9s Details CI / test-go (pull_request) Successful in 1m3s Details CI / iace-gt-coverage (pull_request) Successful in 26s Details CI / test-python-backend (pull_request) Successful in 36s Details CI / test-python-document-crawler (pull_request) Successful in 20s Details CI / test-python-dsms-gateway (pull_request) Successful in 18s Details The old pre-eu-v1 corpus chunks (un-annotated CRA/AI Act/DORA/NIS2/DSGVO duplicates + the old Machinery Directive and its guide) are tagged status=superseded / use_for_primary=false in the vector store. Honor that in the rerank: a superseded result takes a fixed penalty so the eu-v1 norm wins default questions, while the old source stays in the pool (demoted, not hidden) and remains findable for history / transition questions. Verified on dev: "CRA Sicherheitsupdates" now returns CRA Anhang I (eu-v1) at #1 instead of an un-annotated old chunk; MaschinenVO outranks the old Machinery Directive/guide; superseded chunks remain retrievable lower down. Co-Authored-By: Claude Opus 4.7 <noreply@anthropic.com>	2026-06-24 00:22:37 +02:00
Benjamin Admin	989d9f6f91	feat(ai-sdk): citation-graph assessment + opt-in graph expansion (Phase 2) CI / detect-changes (pull_request) Successful in 14s Details CI / branch-name (pull_request) Successful in 1s Details CI / guardrail-integrity (pull_request) Successful in 16s Details CI / secret-scan (pull_request) Successful in 18s Details CI / dep-audit (pull_request) Failing after 1m2s Details CI / sbom-scan (pull_request) Failing after 1m10s Details CI / build-sha-integrity (pull_request) Successful in 13s Details CI / validate-canonical-controls (pull_request) Successful in 14s Details CI / loc-budget (pull_request) Successful in 23s Details CI / go-lint (pull_request) Successful in 50s Details CI / python-lint (pull_request) Failing after 18s Details CI / nodejs-lint (pull_request) Failing after 1m8s Details CI / nodejs-build (pull_request) Successful in 3m7s Details CI / test-go (pull_request) Successful in 1m6s Details CI / iace-gt-coverage (pull_request) Successful in 26s Details CI / test-python-backend (pull_request) Successful in 33s Details CI / test-python-document-crawler (pull_request) Successful in 21s Details CI / test-python-dsms-gateway (pull_request) Successful in 21s Details Add an `assessment` object to the legal RAG search response: primary norm, connected norms (from the citation graph references_out/in of the primary), cross_regime, human_review_flag, a norm-level winner_margin and a short reasoning string. The margin is computed over DISTINCT norms, so a long article split into several chunks no longer fabricates uncertainty. The per-result schema stays frozen — graph fields are internal (json:"-"). Also wire optional citation-graph expansion (RAG_GRAPH_EXPANSION=true, default off): top hits pull their referenced norms into the candidate pool via the precise edge (e.g. Art. 13 CRA -> Anhang I). 
Graph expansion was measured to add no rank gain over the existing binding-law augmentation, while costing +1 Qdrant call per search and carrying reverse-edge fan-out risk, so it ships off by default as a recall safety net. The graph EXPLAINS retrieval (assessment); it does not expand it by default. Co-Authored-By: Claude Opus 4.7 <noreply@anthropic.com>	2026-06-23 19:48:01 +02:00
Benjamin Admin	4c99773fa1	feat(ai-sdk): legal-corpus structure endpoint + coverage page Expose GET /sdk/v1/rag/legal-corpus, which scrolls the eur-lex legal corpus (filtered to a few hundred points regardless of total size) and aggregates each ingested act's composition: distinct articles, annexes, recitals and chunk count. Surface it as a new section on /sdk/coverage so the ingested corpus is no longer a black box — a developer SEES what each act actually contains, not only its name. Co-Authored-By: Claude Opus 4.7 <noreply@anthropic.com>	2026-06-23 19:47:17 +02:00