Spaces:
Running on Zero
Running on Zero
bartwisch committed on
Commit ·
aff88fb
1
Parent(s): b10e8ac
fix: ensure 3-channel input for PaddleOCR
Browse files
- src/ocr_handler.py +8 -1
src/ocr_handler.py
CHANGED
|
@@ -218,6 +218,10 @@ class OCRHandler:
|
|
| 218 |
"""Detect text using Manga-OCR - specialized for manga/comic fonts."""
|
| 219 |
manga_ocr, detector = self._load_manga_ocr()
|
| 220 |
|
|
|
|
|
|
|
|
|
|
|
|
|
| 221 |
# Use PaddleOCR for detection, then manga-ocr for recognition
|
| 222 |
detection_result = detector.ocr(processed_image)
|
| 223 |
|
|
@@ -274,7 +278,10 @@ class OCRHandler:
|
|
| 274 |
"""Detect text using PaddleOCR - fast and general purpose."""
|
| 275 |
reader = self._load_paddleocr()
|
| 276 |
|
| 277 |
-
# PaddleOCR expects
|
|
|
|
|
|
|
|
|
|
| 278 |
result = reader.ocr(processed_image)
|
| 279 |
|
| 280 |
final_results = []
|
|
|
|
| 218 |
"""Detect text using Manga-OCR - specialized for manga/comic fonts."""
|
| 219 |
manga_ocr, detector = self._load_manga_ocr()
|
| 220 |
|
| 221 |
+
# Ensure 3-channel image for PaddleOCR/PaddleX doc preprocessor
|
| 222 |
+
if len(processed_image.shape) == 2:
|
| 223 |
+
processed_image = np.stack([processed_image] * 3, axis=-1)
|
| 224 |
+
|
| 225 |
# Use PaddleOCR for detection, then manga-ocr for recognition
|
| 226 |
detection_result = detector.ocr(processed_image)
|
| 227 |
|
|
|
|
| 278 |
"""Detect text using PaddleOCR - fast and general purpose."""
|
| 279 |
reader = self._load_paddleocr()
|
| 280 |
|
| 281 |
+
# PaddleOCR expects 3-channel BGR/RGB numpy array
|
| 282 |
+
if len(processed_image.shape) == 2:
|
| 283 |
+
processed_image = np.stack([processed_image] * 3, axis=-1)
|
| 284 |
+
|
| 285 |
result = reader.ocr(processed_image)
|
| 286 |
|
| 287 |
final_results = []
|