bartwisch committed on
Commit
aff88fb
·
1 Parent(s): b10e8ac

fix: ensure 3-channel input for PaddleOCR

Browse files
Files changed (1) hide show
  1. src/ocr_handler.py +8 -1
src/ocr_handler.py CHANGED
@@ -218,6 +218,10 @@ class OCRHandler:
218
  """Detect text using Manga-OCR - specialized for manga/comic fonts."""
219
  manga_ocr, detector = self._load_manga_ocr()
220
 
 
 
 
 
221
  # Use PaddleOCR for detection, then manga-ocr for recognition
222
  detection_result = detector.ocr(processed_image)
223
 
@@ -274,7 +278,10 @@ class OCRHandler:
274
  """Detect text using PaddleOCR - fast and general purpose."""
275
  reader = self._load_paddleocr()
276
 
277
- # PaddleOCR expects BGR or RGB numpy array
 
 
 
278
  result = reader.ocr(processed_image)
279
 
280
  final_results = []
 
218
  """Detect text using Manga-OCR - specialized for manga/comic fonts."""
219
  manga_ocr, detector = self._load_manga_ocr()
220
 
221
+ # Ensure 3-channel image for PaddleOCR/PaddleX doc preprocessor
222
+ if len(processed_image.shape) == 2:
223
+ processed_image = np.stack([processed_image] * 3, axis=-1)
224
+
225
  # Use PaddleOCR for detection, then manga-ocr for recognition
226
  detection_result = detector.ocr(processed_image)
227
 
 
278
  """Detect text using PaddleOCR - fast and general purpose."""
279
  reader = self._load_paddleocr()
280
 
281
+ # PaddleOCR expects 3-channel BGR/RGB numpy array
282
+ if len(processed_image.shape) == 2:
283
+ processed_image = np.stack([processed_image] * 3, axis=-1)
284
+
285
  result = reader.ocr(processed_image)
286
 
287
  final_results = []