Restructure: Move 47 cv_* files into ocr/ package
Some checks failed
CI / go-lint (push) Has been skipped
CI / python-lint (push) Has been skipped
CI / nodejs-lint (push) Has been skipped
CI / test-go-school (push) Successful in 39s
CI / test-go-edu-search (push) Successful in 29s
CI / test-python-klausur (push) Failing after 2m34s
CI / test-python-agent-core (push) Successful in 20s
CI / test-nodejs-website (push) Successful in 26s

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>
This commit is contained in:
Benjamin Admin
2026-04-25 21:03:54 +02:00
parent 45287b3541
commit cb1be59e46
95 changed files with 317 additions and 103 deletions

View File

@@ -24,7 +24,7 @@ from typing import Any, Dict, List, Optional, Tuple
import numpy as np
-from cv_vocab_types import (
+from ..types import (
IPA_AVAILABLE,
PageRegion,
RowGeometry,
@@ -47,7 +47,7 @@ except ImportError:
# ── Re-exports from sub-modules (backward compatibility) ──────────────────
-from cv_ocr_word_assembly import ( # noqa: F401
+from .word_assembly import ( # noqa: F401
_group_words_into_lines,
_words_to_reading_order_lines,
_rejoin_hyphenated,
@@ -55,7 +55,7 @@ from cv_ocr_word_assembly import ( # noqa: F401
_words_to_spaced_text,
)
-from cv_ocr_vocab_postprocess import ( # noqa: F401
+from .vocab_postprocess import ( # noqa: F401
_CHAR_CONFUSION_RULES,
_DE_INDICATORS_FOR_EN_I,
_fix_character_confusion,
@@ -66,7 +66,7 @@ from cv_ocr_vocab_postprocess import ( # noqa: F401
_attach_example_sentences,
)
-from cv_ocr_ipa_lookup import ( # noqa: F401
+from .ipa_lookup import ( # noqa: F401
_PHONETIC_BRACKET_RE,
_IPA_CHARS,
_MIN_WORD_CONF,
@@ -80,20 +80,20 @@ from cv_ocr_ipa_lookup import ( # noqa: F401
_insert_missing_ipa,
)
-from cv_ocr_ipa_repair import ( # noqa: F401
+from .ipa_repair import ( # noqa: F401
_has_non_dict_trailing,
_strip_post_bracket_garbled,
fix_ipa_continuation_cell,
_insert_headword_ipa,
)
-from cv_ocr_cell_phonetics import ( # noqa: F401
+from .cell_phonetics import ( # noqa: F401
fix_cell_phonetics,
_has_ipa_gap,
_sync_word_boxes_after_ipa_insert,
)
-from cv_ocr_cell_filter import ( # noqa: F401
+from .cell_filter import ( # noqa: F401
_RE_REAL_WORD,
_RE_ALPHA,
_COMMON_SHORT_WORDS,