feat(ai-sdk): controlled interpretation-intent guidance override (#34)
CI / detect-changes (push) Successful in 5s
CI / branch-name (push) Has been skipped
CI / guardrail-integrity (push) Has been skipped
CI / secret-scan (push) Has been skipped
CI / dep-audit (push) Has been skipped
CI / sbom-scan (push) Has been skipped
CI / build-sha-integrity (push) Successful in 5s
CI / validate-canonical-controls (push) Successful in 3s
CI / loc-budget (push) Successful in 17s
CI / go-lint (push) Has been skipped
CI / python-lint (push) Has been skipped
CI / nodejs-lint (push) Has been skipped
CI / nodejs-build (push) Has been skipped
CI / test-go (push) Successful in 57s
CI / iace-gt-coverage (push) Successful in 15s
CI / test-python-backend (push) Has been skipped
CI / test-python-document-crawler (push) Has been skipped
CI / test-python-dsms-gateway (push) Has been skipped
CI / detect-changes (push) Successful in 5s
CI / branch-name (push) Has been skipped
CI / guardrail-integrity (push) Has been skipped
CI / secret-scan (push) Has been skipped
CI / dep-audit (push) Has been skipped
CI / sbom-scan (push) Has been skipped
CI / build-sha-integrity (push) Successful in 5s
CI / validate-canonical-controls (push) Successful in 3s
CI / loc-budget (push) Successful in 17s
CI / go-lint (push) Has been skipped
CI / python-lint (push) Has been skipped
CI / nodejs-lint (push) Has been skipped
CI / nodejs-build (push) Has been skipped
CI / test-go (push) Successful in 57s
CI / iace-gt-coverage (push) Successful in 15s
CI / test-python-backend (push) Has been skipped
CI / test-python-document-crawler (push) Has been skipped
CI / test-python-dsms-gateway (push) Has been skipped
This commit was merged in pull request #34.
This commit is contained in:
@@ -1,6 +1,9 @@
|
|||||||
package ucca
|
package ucca
|
||||||
|
|
||||||
import "sort"
|
import (
	"sort"
	"strings"
	"unicode"
)
|
||||||
|
|
||||||
// Re-ranking coefficients (validated in the offline golden harness; Phase A — conservative).
|
// Re-ranking coefficients (validated in the offline golden harness; Phase A — conservative).
|
||||||
const (
|
const (
|
||||||
@@ -13,8 +16,46 @@ const (
|
|||||||
scopePenalty = 0.25 // BDSG Teil 3 (law enforcement) on a general DP question
|
scopePenalty = 0.25 // BDSG Teil 3 (law enforcement) on a general DP question
|
||||||
topicGain = 0.18 // amplifier only
|
topicGain = 0.18 // amplifier only
|
||||||
supersededPenalty = 0.50 // superseded Alt-Quelle (pre-eu-v1): demoted, nicht versteckt
|
supersededPenalty = 0.50 // superseded Alt-Quelle (pre-eu-v1): demoted, nicht versteckt
|
||||||
|
guidanceIntentGain = 0.25 // controlled guidance override on explicit interpretation intent
|
||||||
|
guidanceIntentMargin = 0.05 // ...only if the guideline is semantically competitive with binding
|
||||||
)
|
)
|
||||||
|
|
||||||
|
// guidanceIntentSignals mark a query that EXPLICITLY asks for an interpretation /
// recommendation by a guidance body, rather than for the binding obligation. Only
// then may a (semantically competitive) guideline outrank the binding norm.
//
// All entries are lowercase because queryWantsGuidance lowercases the query
// before matching.
var guidanceIntentSignals = []string{
	"edpb", "europäischer datenschutzausschuss", "europaeischer datenschutzausschuss",
	"dsk", "enisa", "bsi", "leitlinie", "guideline", "orientierungshilfe",
	"auslegung", "empfiehlt", "empfehlung", "sagt", "laut",
}

// guidanceSignalIsWholeWord reports whether sig must match a complete query word.
// The acronyms and the short verbs occur inside unrelated words ("bsi" in
// "websites", "sagt" in "untersagt", "laut" in "lautet"), so a substring hit on
// them is not evidence of interpretation intent. Signals not listed here keep
// substring matching so that inflected forms ("Leitlinien", "Empfehlungen") and
// multi-word phrases still match.
func guidanceSignalIsWholeWord(sig string) bool {
	switch sig {
	case "edpb", "dsk", "enisa", "bsi", "sagt", "laut":
		return true
	}
	return false
}

// queryWantsGuidance reports whether the query explicitly asks for guidance/interpretation.
//
// Matching is case-insensitive. Short signals (see guidanceSignalIsWholeWord) must
// appear as a whole word, where words are maximal runs of letters and digits; all
// other signals match anywhere in the lowercased query.
func queryWantsGuidance(query string) bool {
	q := strings.ToLower(query)
	// Split on everything that is not a letter or digit so that "BSI-Empfehlung"
	// and "laut DSK ..." yield the bare tokens "bsi", "empfehlung", "laut", "dsk".
	words := strings.FieldsFunc(q, func(r rune) bool {
		return !unicode.IsLetter(r) && !unicode.IsDigit(r)
	})
	for _, sig := range guidanceIntentSignals {
		if !guidanceSignalIsWholeWord(sig) {
			if strings.Contains(q, sig) {
				return true
			}
			continue
		}
		for _, w := range words {
			if w == sig {
				return true
			}
		}
	}
	return false
}
|
||||||
|
|
||||||
|
// bestBindingSemantic returns the highest RAW semantic score among binding-law
|
||||||
|
// results (0 if none / intent not requested). Used as the guard threshold so an
|
||||||
|
// off-topic guideline cannot ride the interpretation-intent boost.
|
||||||
|
func bestBindingSemantic(results []LegalSearchResult, wantsGuidance bool) float64 {
|
||||||
|
if !wantsGuidance {
|
||||||
|
return 0
|
||||||
|
}
|
||||||
|
best := 0.0
|
||||||
|
for _, r := range results {
|
||||||
|
if r.SourceClass == "binding_law" && r.Score > best {
|
||||||
|
best = r.Score
|
||||||
|
}
|
||||||
|
}
|
||||||
|
return best
|
||||||
|
}
|
||||||
|
|
||||||
// authorityScore computes the normative relevance of a result for a query. It augments the
|
// authorityScore computes the normative relevance of a result for a query. It augments the
|
||||||
// semantic score with authority/jurisdiction/domain/scope/topic signals. Exposed for tests.
|
// semantic score with authority/jurisdiction/domain/scope/topic signals. Exposed for tests.
|
||||||
func authorityScore(query string, r LegalSearchResult, qDomain string, qForeign bool) float64 {
|
func authorityScore(query string, r LegalSearchResult, qDomain string, qForeign bool) float64 {
|
||||||
@@ -62,11 +103,21 @@ func rerankByAuthority(query string, results []LegalSearchResult) []LegalSearchR
|
|||||||
}
|
}
|
||||||
qDomain := queryDomain(query)
|
qDomain := queryDomain(query)
|
||||||
qForeign := queryIsForeign(query)
|
qForeign := queryIsForeign(query)
|
||||||
|
wantsGuidance := queryWantsGuidance(query)
|
||||||
|
bestBindingSem := bestBindingSemantic(results, wantsGuidance)
|
||||||
|
|
||||||
out := make([]LegalSearchResult, len(results))
|
out := make([]LegalSearchResult, len(results))
|
||||||
copy(out, results)
|
copy(out, results)
|
||||||
for i := range out {
|
for i := range out {
|
||||||
out[i].Score = authorityScore(query, out[i], qDomain, qForeign)
|
out[i].Score = authorityScore(query, out[i], qDomain, qForeign)
|
||||||
|
// Interpretations-Intent (eng begrenzt): NUR wenn die Query explizit nach
|
||||||
|
// Guidance/Auslegung fragt UND die Leitlinie semantisch konkurrenzfaehig ist
|
||||||
|
// (>= bester binding-Treffer - margin), darf supervisory_guidance die bindende
|
||||||
|
// Norm ueberholen. Sonst bleibt binding > guidance (Normfrage unveraendert).
|
||||||
|
if wantsGuidance && out[i].SourceClass == "supervisory_guidance" &&
|
||||||
|
results[i].Score >= bestBindingSem-guidanceIntentMargin {
|
||||||
|
out[i].Score += guidanceIntentGain
|
||||||
|
}
|
||||||
}
|
}
|
||||||
sort.SliceStable(out, func(a, b int) bool {
|
sort.SliceStable(out, func(a, b int) bool {
|
||||||
return out[a].Score > out[b].Score
|
return out[a].Score > out[b].Score
|
||||||
|
|||||||
@@ -0,0 +1,72 @@
|
|||||||
|
package ucca
|
||||||
|
|
||||||
|
import "testing"
|
||||||
|
|
||||||
|
func intentRes(reg, sourceClass string, sem float64, weight int) LegalSearchResult {
|
||||||
|
return LegalSearchResult{
|
||||||
|
RegulationShort: reg, SourceClass: sourceClass, Score: sem,
|
||||||
|
AuthorityWeight: weight, Jurisdiction: "EU",
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
func TestQueryWantsGuidance(t *testing.T) {
|
||||||
|
wants := []string{
|
||||||
|
"Was empfiehlt der EDPB zum DSB?",
|
||||||
|
"Was sagt die ENISA zu Security Updates?",
|
||||||
|
"laut DSK ...",
|
||||||
|
"Orientierungshilfe zur DSFA",
|
||||||
|
"Welche BSI-Empfehlung gilt?",
|
||||||
|
"Auslegung der Aufsichtsbehörde",
|
||||||
|
}
|
||||||
|
plain := []string{
|
||||||
|
"Ab wann braucht man einen Datenschutzbeauftragten?",
|
||||||
|
"Welche Anforderungen bestehen an Security Updates?",
|
||||||
|
}
|
||||||
|
for _, q := range wants {
|
||||||
|
if !queryWantsGuidance(q) {
|
||||||
|
t.Errorf("should detect interpretation intent: %q", q)
|
||||||
|
}
|
||||||
|
}
|
||||||
|
for _, q := range plain {
|
||||||
|
if queryWantsGuidance(q) {
|
||||||
|
t.Errorf("should NOT detect intent (norm question): %q", q)
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
func TestRerank_NormQuestion_BindingStaysTop(t *testing.T) {
|
||||||
|
// No intent signal → binding wins even though guidance is semantically higher.
|
||||||
|
results := []LegalSearchResult{
|
||||||
|
intentRes("EDPB DPO", "supervisory_guidance", 0.64, 70),
|
||||||
|
intentRes("DSGVO", "binding_law", 0.58, 100),
|
||||||
|
}
|
||||||
|
out := rerankByAuthority("Ab wann braucht man einen Datenschutzbeauftragten?", results)
|
||||||
|
if out[0].SourceClass != "binding_law" {
|
||||||
|
t.Errorf("norm question: binding must stay Top-1, got %s", out[0].SourceClass)
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
func TestRerank_InterpretationQuestion_GuidanceMayWin(t *testing.T) {
|
||||||
|
// Explicit intent + guidance semantically competitive → guidance wins.
|
||||||
|
results := []LegalSearchResult{
|
||||||
|
intentRes("EDPB DPO", "supervisory_guidance", 0.64, 70),
|
||||||
|
intentRes("DSGVO", "binding_law", 0.58, 100),
|
||||||
|
}
|
||||||
|
out := rerankByAuthority("Was empfiehlt der EDPB zum Datenschutzbeauftragten?", results)
|
||||||
|
if out[0].SourceClass != "supervisory_guidance" {
|
||||||
|
t.Errorf("interpretation question: guidance should win Top-1, got %s", out[0].SourceClass)
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
func TestRerank_OffTopicGuidance_BlockedByGuard(t *testing.T) {
|
||||||
|
// Intent present, but guidance semantic is far below the best binding hit →
|
||||||
|
// the margin guard keeps binding on top (no off-topic guideline override).
|
||||||
|
results := []LegalSearchResult{
|
||||||
|
intentRes("EDPB DPO", "supervisory_guidance", 0.40, 70),
|
||||||
|
intentRes("DSGVO", "binding_law", 0.58, 100),
|
||||||
|
}
|
||||||
|
out := rerankByAuthority("Was empfiehlt der EDPB zum Datenschutzbeauftragten?", results)
|
||||||
|
if out[0].SourceClass != "binding_law" {
|
||||||
|
t.Errorf("off-topic guidance must not win even with intent, got %s", out[0].SourceClass)
|
||||||
|
}
|
||||||
|
}
|
||||||
Reference in New Issue
Block a user