Spaces:

Sabari231024
/

VISPA2

Sleeping

Sabari231024 committed on Oct 25, 2023

Commit

c9b1147

1 Parent(s): 3c3aa88

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -7,6 +7,7 @@ from googletrans import Translator
 import cv2
 import numpy as np
 import tempfile
 def trans(text, lang='ta'):
     translator = Translator()
@@ -37,16 +38,27 @@ def object_recognition(image_array, lang):
     return audio_file
 def ocr_detection(image_array, lang):
-    # Convert the NumPy array to PIL Image
     image = Image.fromarray(image_array)
-    client = Client("https://kneelesh48-tesseract-ocr.hf.space/")
-    result = client.predict(image, "afr", api_name="/tesseract-ocr")
-    print(result)
-    text = "OCR detection result for the captured image."
-    audio_file = trans(result, lang)
     return audio_file
 def operator(image_array, value, lang):
     if value == "1":
         audio_file = object_recognition(image_array, lang)

 import cv2
 import numpy as np
 import tempfile
+import base64
 def trans(text, lang='ta'):
     translator = Translator()
     return audio_file
 def ocr_detection(image_array, lang):
     image = Image.fromarray(image_array)
+    buffered = BytesIO()
+    image.save(buffered, format="PNG")
+    image_base64 = base64.b64encode(buffered.getvalue()).decode()
+    response = requests.post("https://pragnakalp-ocr-image-to-text.hf.space/run/predict", json={
+        "data": [
+            "PaddleOCR",
+            f"data:image/png;base64,{image_base64}",
+        ]
+    }).json()
+    data = response.get("data", [])
+    text = " ".join(data)
+    audio_file = trans(text, lang)
     return audio_file
 def operator(image_array, value, lang):
     if value == "1":
         audio_file = object_recognition(image_array, lang)