Spaces:

meissosisai
/

Codeai

Sleeping

zhlajiex committed on Jan 28

Commit

ed58206

1 Parent(s): 1856281

Feat: Support .heic image format for OCR

Files changed (3) hide show

Dockerfile CHANGED Viewed

@@ -21,7 +21,7 @@ ENV PATH="$VIRTUAL_ENV/bin:$PATH"
 # Install PaddleOCR and Dependencies
 # This might take a while to build/download
-RUN pip install --no-cache-dir paddlepaddle paddleocr
 # Set working directory
 WORKDIR /app

 # Install PaddleOCR and Dependencies
 # This might take a while to build/download
+RUN pip install --no-cache-dir paddlepaddle paddleocr pillow pillow-heif
 # Set working directory
 WORKDIR /app

backend/services/paddle_ocr.py CHANGED Viewed

@@ -1,18 +1,23 @@
 import sys
 import os
 import logging
 # Disable heavy logging from Paddle
 os.environ['GLOG_minloglevel'] = '3'
 try:
     from paddleocr import PaddleOCR
 except ImportError:
-    print("Error: paddleocr not installed. Please run 'pip install paddleocr paddlepaddle'")
     sys.exit(1)
 # Initialize OCR engine
-# lang='en' is default. use_angle_cls=True helps with rotated text
 ocr = PaddleOCR(use_angle_cls=True, lang='en', show_log=False)
 def process_image(img_path):
@@ -21,16 +26,26 @@ def process_image(img_path):
         sys.exit(1)
     try:
-        result = ocr.ocr(img_path, cls=True)
         full_text = []
-        # Result structure: [ [ [ [x1,y1],[x2,y2].. ], ("text", conf) ], ... ]
         if result and result[0]:
             for line in result[0]:
                 text = line[1][0]
                 full_text.append(text)
-        # Output strictly the text to stdout for Node.js to capture
         print("\n".join(full_text))
     except Exception as e:
@@ -42,4 +57,4 @@ if __name__ == "__main__":
         print("Usage: python paddle_ocr.py <image_path>")
         sys.exit(1)
-    process_image(sys.argv[1])

 import sys
 import os
 import logging
+import numpy as np
 # Disable heavy logging from Paddle
 os.environ['GLOG_minloglevel'] = '3'
 try:
     from paddleocr import PaddleOCR
+    from PIL import Image
+    import pillow_heif
 except ImportError:
+    print("Error: Missing dependencies. Run 'pip install paddleocr paddlepaddle pillow pillow-heif'")
     sys.exit(1)
+# Register HEIC opener
+pillow_heif.register_heif_opener()
 # Initialize OCR engine
 ocr = PaddleOCR(use_angle_cls=True, lang='en', show_log=False)
 def process_image(img_path):
         sys.exit(1)
     try:
+        # Check extension for HEIC handling
+        ext = os.path.splitext(img_path)[1].lower()
+        img_input = img_path
+        # If HEIC, load with Pillow and convert to numpy array (RGB)
+        if ext == '.heic':
+            image = Image.open(img_path)
+            if image.mode != 'RGB':
+                image = image.convert('RGB')
+            img_input = np.array(image)
+        result = ocr.ocr(img_input, cls=True)
         full_text = []
         if result and result[0]:
             for line in result[0]:
                 text = line[1][0]
                 full_text.append(text)
         print("\n".join(full_text))
     except Exception as e:
         print("Usage: python paddle_ocr.py <image_path>")
         sys.exit(1)
+    process_image(sys.argv[1])

backend/utils/fileProcessor.js CHANGED Viewed

@@ -11,7 +11,7 @@ exports.processFile = async (filePath) => {
   let content = '';
   try {
-    if (['.png', '.jpg', '.jpeg', '.webp'].includes(ext)) {
       // Process image with Local PaddleOCR
       console.log(`[PaddleOCR] Initiating local analysis for: ${fileName}...`);

   let content = '';
   try {
+    if (['.png', '.jpg', '.jpeg', '.webp', '.heic'].includes(ext)) {
       // Process image with Local PaddleOCR
       console.log(`[PaddleOCR] Initiating local analysis for: ${fileName}...`);