Files
breakpilot-compliance/backend-compliance/tests/test_cross_placement_agent.py
T
Benjamin Admin 154e8c293b
CI / detect-changes (push) Successful in 6s
CI / branch-name (push) Has been skipped
CI / guardrail-integrity (push) Has been skipped
CI / secret-scan (push) Has been skipped
CI / dep-audit (push) Has been skipped
CI / sbom-scan (push) Has been skipped
CI / build-sha-integrity (push) Failing after 4s
CI / validate-canonical-controls (push) Successful in 11s
CI / loc-budget (push) Successful in 14s
CI / go-lint (push) Has been skipped
CI / python-lint (push) Has been skipped
CI / nodejs-lint (push) Has been skipped
CI / nodejs-build (push) Has been skipped
CI / test-go (push) Has been skipped
CI / iace-gt-coverage (push) Has been skipped
CI / test-python-backend (push) Successful in 29s
CI / test-python-document-crawler (push) Has been skipped
CI / test-python-dsms-gateway (push) Has been skipped
feat(agents): Cross-Placement-Agent (deplatzierter Content)
Sprint 1.9 (User-Vorgabe 2026-06-09):

Erkennt im Impressum Inhalts-Sektionen die thematisch besser in
einen Footer-Reiter 'Legal' gehoeren:
  - Urheberrecht / Copyright          -> LOW  (Footer 'Legal')
  - Bilder & Lizenzen                  -> LOW  (Seite 'Bildquellen')
  - Haftungsausschluss / Disclaimer    -> LOW  (Seite 'Disclaimer')
  - Nutzungsbedingungen                -> LOW  (Seite 'AGB')
  - Aenderungsvorbehalt                -> LOW
  - ElektroG / WEEE-Reg                -> MEDIUM (Produktinfo)
  - VerpackG / LUCID                   -> MEDIUM
  - BattG                              -> MEDIUM

Each Finding empfiehlt konkret den 'Legal'-Footer-Reiter
einzufuehren als Best Practice ('Impressum bleibt schlank
und enthaelt ausschliesslich die Pflichtangaben nach § 5
TMG/DDG').

Tests gegen die 5 GT-Impressums:
  - Safetykon: 3 Findings (Urheberrecht, Bilder/Lizenzen,
    Haftungsausschluss)
  - Hectronic: 3 Findings (WEEE-MEDIUM, Copyright, Haftung)
  - ETO/BMW/Elli: 0 Findings (sauber)
  - 9/9 Tests gruen.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
2026-06-09 08:19:57 +02:00

123 lines
3.9 KiB
Python

"""Tests für den Cross-Placement-Agent (deplatzierter Content)."""
from __future__ import annotations
import asyncio
import pytest
from compliance.services.specialist_agents import (
REGISTRY,
AgentInput,
CrossPlacementAgent,
Severity,
)
from tests.fixtures.impressum_groundtruth import (
ETO, HECTRONIC, SAFETYKON, BMW,
)
def _run(coro):
return asyncio.get_event_loop().run_until_complete(coro)
def test_agent_is_registered():
agent = REGISTRY.get("cross_placement")
assert agent is not None
assert agent.doc_type == "impressum"
def test_short_text_skipped():
agent = CrossPlacementAgent()
out = _run(agent.evaluate(AgentInput(doc_type="impressum", text="x")))
assert all(c.status == "skipped" for c in out.mc_coverage)
def test_eto_finds_nutzungsbedingungen_and_haftung():
"""ETO-Impressum hat Nutzungsbedingungen + Haftungsbeschränkung —
Cross-Placement-Agent muss das melden."""
agent = CrossPlacementAgent()
out = _run(agent.evaluate(AgentInput(
doc_type="impressum", text=ETO.text,
)))
field_ids = {f.field_id for f in out.findings}
# ETO-Impressum hat keine Sektionen wie Copyright/Disclaimer →
# nur die Pflichtangaben. Test prüft dass ETO sauber ist.
# User-GT: placement_concerns = () → 0 Findings erwartet
assert not out.findings, (
f"ETO sollte keine Placement-Findings haben, hat aber: "
f"{field_ids}"
)
def test_safetykon_finds_urheberrecht_and_haftung():
"""Safetykon hat Urheberrecht + Bilder/Lizenzen + Haftungsausschluss
im Impressum-Block — alle drei sollen gemeldet werden."""
agent = CrossPlacementAgent()
out = _run(agent.evaluate(AgentInput(
doc_type="impressum", text=SAFETYKON.text,
)))
field_ids = {f.field_id for f in out.findings}
assert "urheberrecht" in field_ids
assert "bilder_lizenzen" in field_ids
assert "haftungsausschluss" in field_ids
def test_hectronic_finds_weee_copyright_haftung():
"""Hectronic hat WEEE-Reg + Copyright + Haftungsausschluss im
Impressum-Block."""
agent = CrossPlacementAgent()
out = _run(agent.evaluate(AgentInput(
doc_type="impressum", text=HECTRONIC.text,
)))
field_ids = {f.field_id for f in out.findings}
assert "weee_elektrog" in field_ids
assert "urheberrecht" in field_ids # 'Copyright' heading
assert "haftungsausschluss" in field_ids
def test_bmw_is_clean():
"""BMW-Impressum ist sauber (nur Pflichtangaben) — 0 Findings."""
agent = CrossPlacementAgent()
out = _run(agent.evaluate(AgentInput(
doc_type="impressum", text=BMW.text,
)))
assert not out.findings, (
f"BMW sollte sauber sein, hat aber: "
f"{[f.field_id for f in out.findings]}"
)
def test_recommendation_mentions_legal_footer():
"""Best-Practice-Empfehlung muss 'Legal'-Footer-Tab vorschlagen."""
agent = CrossPlacementAgent()
out = _run(agent.evaluate(AgentInput(
doc_type="impressum", text=HECTRONIC.text,
)))
assert out.findings
sample = out.findings[0]
assert "Legal" in sample.action
assert "Footer" in sample.action
def test_weee_is_product_compliance_medium():
"""ElektroG/WEEE ist eine echte Pflicht aber Ort umstritten →
MEDIUM statt LOW."""
agent = CrossPlacementAgent()
out = _run(agent.evaluate(AgentInput(
doc_type="impressum", text=HECTRONIC.text,
)))
weee = next(f for f in out.findings if f.field_id == "weee_elektrog")
assert weee.severity == Severity.MEDIUM.value
def test_copyright_is_low():
"""Copyright/Urheberrecht ist BPa nicht zwingend Impressum-Pflicht →
LOW."""
agent = CrossPlacementAgent()
out = _run(agent.evaluate(AgentInput(
doc_type="impressum", text=SAFETYKON.text,
)))
cp = next(f for f in out.findings if f.field_id == "urheberrecht")
assert cp.severity == Severity.LOW.value