From 41ff7671cd812b046ae43a1759f897b1b17958eb Mon Sep 17 00:00:00 2001 From: Benjamin Admin Date: Fri, 13 Mar 2026 09:39:33 +0100 Subject: [PATCH] fix: update PaddleOCR init for v3.4+ API (lang=en, ocr_version=PP-OCRv5) PaddleOCR 3.4.0 removed 'latin' language support. Use 'en' with explicit ocr_version='PP-OCRv5' instead, with fallback for older API. Co-Authored-By: Claude Opus 4.6 --- paddleocr-service/main.py | 19 ++++++++++++++----- 1 file changed, 14 insertions(+), 5 deletions(-) diff --git a/paddleocr-service/main.py b/paddleocr-service/main.py index 1195c5e..c6e3899 100644 --- a/paddleocr-service/main.py +++ b/paddleocr-service/main.py @@ -18,11 +18,20 @@ def get_engine(): if _engine is None: from paddleocr import PaddleOCR - _engine = PaddleOCR( - lang="latin", - use_angle_cls=True, - show_log=False, - ) + # PaddleOCR >= 3.x: use ocr_version param; fallback for older API + try: + _engine = PaddleOCR( + lang="en", + ocr_version="PP-OCRv5", + use_angle_cls=True, + show_log=False, + ) + except (ValueError, TypeError): + _engine = PaddleOCR( + lang="latin", + use_angle_cls=True, + show_log=False, + ) return _engine