This repository has been archived on 2026-02-15. You can view files and clone it. You cannot open issues or pull requests or push a commit.
Files
breakpilot-pwa/edu-search-service/rules/trust_rules.yaml
Benjamin Admin 21a844cb8a fix: Restore all files lost during destructive rebase
A previous `git pull --rebase origin main` dropped 177 local commits,
losing 3400+ files across admin-v2, backend, studio-v2, website,
klausur-service, and many other services. The partial restore attempt
(660295e2) only recovered some files.

This commit restores all missing files from pre-rebase ref 98933f5e
while preserving post-rebase additions (night-scheduler, night-mode UI,
NightModeWidget dashboard integration).

Restored features include:
- AI Module Sidebar (FAB), OCR Labeling, OCR Compare
- GPU Dashboard, RAG Pipeline, Magic Help
- Klausur-Korrektur (8 files), Abitur-Archiv (5+ files)
- Companion, Zeugnisse-Crawler, Screen Flow
- Full backend, studio-v2, website, klausur-service
- All compliance SDKs, agent-core, voice-service
- CI/CD configs, documentation, scripts

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>
2026-02-09 09:51:32 +01:00

118 lines
2.8 KiB
YAML

# Trust Score Regeln für Education Search
# Score-Berechnung: Summe aller matchenden Regeln, dann clamp(0, 1)
# Per-domain trust boosts. Every rule has a `match` host glob, an `add`
# score delta and a human-readable `reason`.
# NOTE(review): whether a pattern such as "*.kmk.org" also matches the bare
# apex host "kmk.org" depends on the matcher implementation - confirm.
domain_boosts:
  # Federal level (highest trust tier)
  - match: "*.kmk.org"
    add: 0.50
    reason: "KMK - Kultusministerkonferenz"
  - match: "*.bildungsserver.de"
    add: 0.50
    reason: "Deutscher Bildungsserver"
  - match: "*.bpb.de"
    add: 0.45
    reason: "Bundeszentrale für politische Bildung"
  - match: "*.bmbf.de"
    add: 0.50
    reason: "BMBF"
  - match: "*.iqb.hu-berlin.de"
    add: 0.50
    reason: "IQB Bildungsstandards"

  # State ministries
  - match: "*.bayern.de"
    add: 0.45
    reason: "Bayern offiziell"
  - match: "*.nrw.de"
    add: 0.45
    reason: "NRW offiziell"
  - match: "*.berlin.de"
    add: 0.45
    reason: "Berlin offiziell"
  - match: "*.sachsen.de"
    add: 0.45
    reason: "Sachsen offiziell"
  - match: "*.niedersachsen.de"
    add: 0.45
    reason: "Niedersachsen offiziell"
  - match: "*.hessen.de"
    add: 0.45
    reason: "Hessen offiziell"
  - match: "*.brandenburg.de"
    add: 0.45
    reason: "Brandenburg offiziell"
  - match: "*.thueringen.de"
    add: 0.45
    reason: "Thüringen offiziell"

  # Education servers of the federal states
  - match: "*.nibis.de"
    add: 0.40
    reason: "Niedersachsen Bildungsserver"
  # NOTE(review): hosts under learnline.nrw.de presumably also match the
  # "*.nrw.de" rule above; if all matching rules are summed, both boosts
  # apply (0.40 + 0.45) before clamping - confirm this is intended.
  - match: "*.learnline.nrw.de"
    add: 0.40
    reason: "NRW Bildungsserver"
  - match: "*.schule-bw.de"
    add: 0.40
    reason: "BW Bildungsserver"

  # Universities
  # NOTE(review): these prefix globs presumably match any registrable .de
  # domain that starts with "uni-", "tu-" or "fh-" - verify against matcher.
  - match: "*.uni-*.de"
    add: 0.30
    reason: "Deutsche Universität"
  - match: "*.tu-*.de"
    add: 0.30
    reason: "Technische Universität"
  - match: "*.fh-*.de"
    add: 0.25
    reason: "Fachhochschule"

  # Established portals
  - match: "*.zum.de"
    add: 0.25
    reason: "ZUM - Zentrale für Unterrichtsmedien"
  - match: "*.lehrer-online.de"
    add: 0.20
    reason: "Lehrer-Online Portal"
  - match: "*.4teachers.de"
    add: 0.20
    reason: "4teachers Portal"
# Boosts keyed on the top-level domain. Every rule has a `tld` suffix, an
# `add` score delta and a human-readable `reason`.
tld_boosts:
  - tld: ".gov"
    add: 0.40
    reason: "Government TLD"
  - tld: ".edu"
    add: 0.35
    reason: "Education TLD"
# URL-based penalties. Every rule lists tokens in `if_url_contains` and a
# negative `add` score delta with a human-readable `reason`.
# NOTE(review): presumably a rule fires when the URL contains any one of
# its tokens as a plain substring - confirm against the rule evaluator.
penalties:
  # URL patterns that hint at advertising/tracking
  - if_url_contains: ["utm_", "affiliate", "partner=", "ref="]
    add: -0.10
    reason: "Tracking/Affiliate Parameter"

  # Commercial signals
  # NOTE(review): "shop" is also a substring of "workshop"; if matching is
  # substring-based, workshop pages would be penalised too - verify.
  - if_url_contains: ["shop", "kaufen", "bestellen", "warenkorb"]
    add: -0.20
    reason: "E-Commerce Signale"

  # SEO spam indicators
  - if_url_contains: ["gratis-", "kostenlos-download", "sofort-"]
    add: -0.15
    reason: "SEO-Spam Muster"
# Content-based penalties (set by the extractor).
# Every rule has one threshold key (`..._gt` / `..._lt`), a negative `add`
# score delta and a human-readable `reason`.
content_penalties:
  - if_ad_density_gt: 0.20
    add: -0.30
    reason: "Hoher Werbeanteil"
  - if_link_density_gt: 0.40
    add: -0.20
    reason: "Hohe Link-Dichte (Linkfarm)"
  # NOTE(review): the unit of the length threshold (characters, words, ...)
  # is not stated in this file - confirm against the extractor.
  - if_content_length_lt: 200
    add: -0.25
    reason: "Sehr wenig Content"