This repository has been archived on 2026-02-15. You can view files and clone it. You cannot open issues or pull requests or push a commit.
Files
breakpilot-pwa/edu-search-service/rules/subject_rules.yaml
Benjamin Admin 21a844cb8a fix: Restore all files lost during destructive rebase
A previous `git pull --rebase origin main` dropped 177 local commits,
losing 3400+ files across admin-v2, backend, studio-v2, website,
klausur-service, and many other services. The partial restore attempt
(660295e2) only recovered some files.

This commit restores all missing files from pre-rebase ref 98933f5e
while preserving post-rebase additions (night-scheduler, night-mode UI,
NightModeWidget dashboard integration).

Restored features include:
- AI Module Sidebar (FAB), OCR Labeling, OCR Compare
- GPU Dashboard, RAG Pipeline, Magic Help
- Klausur-Korrektur (8 files), Abitur-Archiv (5+ files)
- Companion, Zeugnisse-Crawler, Screen Flow
- Full backend, studio-v2, website, klausur-service
- All compliance SDKs, agent-core, voice-service
- CI/CD configs, documentation, scripts

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>
2026-02-09 09:51:32 +01:00

286 lines
5.0 KiB
YAML

# Subject (school subject) tagging rules.
# Each subject carries three keyword lists. Per-hit score format:
#   strong (+3), weak (+1), negative (-2)
# Keywords are lowercase with umlauts transliterated (ae/oe/ue).
# NOTE(review): presumably matched against text normalized the same way;
# confirm against the scoring code.
subjects:
  Mathe:
    strong:
      - "mathematik"
      - "mathe"
      - "algebra"
      - "geometrie"
      - "stochastik"
      - "analysis"
      - "prozentrechnung"
      - "gleichungen"
      - "funktionen"
      - "trigonometrie"
      - "wahrscheinlichkeit"
    weak:
      - "zahlen"
      - "terme"
      - "diagramme"
      - "brueche"
      - "dreisatz"
      - "rechnen"
    negative: []
  Deutsch:
    strong:
      - "deutschunterricht"
      - "grammatik"
      - "rechtschreibung"
      - "aufsatz"
      - "textanalyse"
      - "literatur"
      - "argumentation"
      - "erzaehlung"
      - "lyrik"
      - "drama"
      - "epik"
    weak:
      - "lesen"
      - "schreiben"
      - "woerter"
      - "satzglieder"
    negative:
      - "deutschland"
      - "deutsche geschichte"
  Englisch:
    strong:
      - "englischunterricht"
      - "english"
      - "grammar"
      - "vocabulary"
      - "reading comprehension"
      - "listening"
      - "speaking"
    weak:
      - "text"
      - "dialogue"
    negative: []
  Franzoesisch:
    strong:
      - "franzoesisch"
      - "francais"
      - "french"
      - "grammaire"
    weak:
      - "texte"
    negative: []
  Latein:
    strong:
      - "latein"
      - "lateinunterricht"
      - "grammatik latein"
    weak:
      - "uebersetzung"
      - "vokabel"
    negative: []
  Biologie:
    strong:
      - "biologie"
      - "bio"
      - "oekologie"
      - "evolution"
      - "genetik"
      - "zellbiologie"
      - "stoffwechsel"
      - "neurobiologie"
    weak:
      - "zelle"
      - "organismus"
      - "lebewesen"
    negative: []
  Chemie:
    strong:
      - "chemie"
      - "chemieunterricht"
      - "organische chemie"
      - "anorganische chemie"
      - "reaktionsgleichung"
      - "periodensystem"
    weak:
      - "element"
      - "verbindung"
      - "reaktion"
    negative: []
  Physik:
    strong:
      - "physik"
      - "physikunterricht"
      - "mechanik"
      - "elektrizitaet"
      - "optik"
      - "thermodynamik"
      - "quantenphysik"
    weak:
      - "energie"
      - "kraft"
      - "bewegung"
    negative: []
  Informatik:
    strong:
      - "informatik"
      - "programmierung"
      - "algorithmus"
      - "datenstruktur"
      - "python"
      - "java"
      - "sql"
      - "netzwerke"
    weak:
      - "code"
      - "daten"
      - "computer"
    negative: []
  Geschichte:
    strong:
      - "geschichtsunterricht"
      - "historisch"
      - "weimarer republik"
      - "nationalsozialismus"
      - "mittelalter"
      - "aufklaerung"
      - "industrialisierung"
      - "antike"
      - "renaissance"
    weak:
      - "quelle"
      - "chronologie"
      - "epoche"
    negative: []
  Politik_Sozialkunde:
    strong:
      - "politik"
      - "politikunterricht"
      - "sozialkunde"
      - "gemeinschaftskunde"
      - "demokratie"
      - "grundgesetz"
      - "bundestag"
      - "wahlen"
      - "parteien"
    weak:
      - "rechte"
      - "pflichten"
      - "institutionen"
    negative:
      - "europaeische union"  # too generic
  Geographie:
    strong:
      - "geographie"
      - "geografie"
      - "erdkunde"
      - "topographie"
      - "klimazonen"
      - "plattentektonik"
    weak:
      - "karte"
      - "landschaft"
      - "kontinent"
    negative: []
  Religion_Ethik:
    strong:
      - "religionsunterricht"
      - "ethik"
      - "philosophie"
      - "weltreligionen"
      - "bibel"
      - "christentum"
      - "islam"
      - "judentum"
    weak:
      - "werte"
      - "moral"
    negative: []
  Kunst:
    strong:
      - "kunstunterricht"
      - "bildende kunst"
      - "malerei"
      - "zeichnen"
      - "gestaltung"
      - "kunstgeschichte"
    weak:
      - "bild"
      - "farbe"
    negative:
      - "kunststoff"
  Musik:
    strong:
      - "musikunterricht"
      - "musiktheorie"
      - "notenlehre"
      - "rhythmus"
      - "harmonie"
      - "instrument"
    weak:
      - "lied"
      - "melodie"
    negative: []
  Sport:
    strong:
      - "sportunterricht"
      - "bewegung sport"
      - "leichtathletik"
      - "ballsport"
      - "turnen"
      - "schwimmen unterricht"
    weak:
      - "spiel"
      - "fitness"
    negative:
      - "sportlich"
      - "esport"
  Wirtschaft:
    strong:
      - "wirtschaftsunterricht"
      - "oekonomie"
      - "volkswirtschaft"
      - "betriebswirtschaft"
      - "marktwirtschaft"
    weak:
      - "unternehmen"
      - "markt"
    negative: []
  Sachunterricht:
    strong:
      - "sachunterricht"
      - "heimat- und sachunterricht"
      - "hsu"
    weak:
      - "grundschule thema"
    negative: []
  DaZ_DaF:
    strong:
      - "deutsch als zweitsprache"
      - "deutsch als fremdsprache"
      - "daz"
      - "daf"
      - "alphabetisierung"
    weak:
      - "sprachfoerderung"
      - "integration"
    negative: []
# Limits for subject assignment.
# Minimum score required to assign a subject.
threshold: 4
# At most 3 subjects per document.
max_subjects: 3