Spaces:

Beat03
/

ocr

Running

App Files Files Community

Beat03 committed on Mar 5, 2025

Commit

e2c5a1e

verified ·

1 Parent(s): ad3e865

Upload 2 files

Browse files

Files changed (2) hide show

app.py +65 -0
requirements.txt +5 -0

app.py ADDED Viewed

	@@ -0,0 +1,65 @@

+import base64
+import io
+import os
+import tempfile
+
+import gradio as gr
+import numpy as np
+import requests
+from PIL import Image
+from zhipuai import ZhipuAI
+# Thay API Key của bạn tại đây
+API_KEY = "d659608f7d5d42b1821a9303fc50b618.NesCuIytwpxjxpBJ"
+# Khởi tạo ZhipuAI client
+client = ZhipuAI(api_key=API_KEY)
+def extract_text(image):
+    if isinstance(image, np.ndarray):  # Chuyển NumPy array thành ảnh
+        image = Image.fromarray(image)
+    # Chuyển đổi ảnh sang Base64
+    buffered = io.BytesIO()
+    image.save(buffered, format="PNG")
+    image_base64 = base64.b64encode(buffered.getvalue()).decode("utf-8")
+    # Gửi yêu cầu đến GLM-4V
+    response = client.chat.completions.create(
+        model="glm-4v-plus",
+        messages=[
+            {
+                "role": "user",
+                "content": [
+                    {"type": "image_url", "image_url": {"url": f"data:image/png;base64,{image_base64}"}},
+                    {"type": "text", "text": "Hãy trích xuất toàn bộ chữ viết tay trong ảnh, giữ nguyên dấu câu, giữ dấu của từng chữ, khoảng cách dòng, và chính tả như trong ảnh."}
+                ]
+            }
+        ]
+    )
+    # Xử lý phản hồi từ API
+    if response and response.choices:
+        text = response.choices[0].message.content
+        output_text_file = "output.md"
+        with open(output_text_file, "w", encoding="utf-8") as f:
+            f.write(text)
+        output_image_file = "output_image.png"
+        image.save(output_image_file, format="PNG")
+        return text, output_text_file, output_image_file
+    else:
+        return "Lỗi: Không nhận được kết quả từ API.", None, None
+demo = gr.Interface(
+    fn=extract_text,
+    inputs="image",
+    outputs=[
+        "text",
+        gr.File(label="Tải xuống file văn bản (output.md)"),
+        gr.File(label="Tải xuống ảnh gốc (output_image.png)")
+    ],
+    title="Vietnamese Handwriting OCR",
+    description="Upload an image to extract handwritten text using ZhipuAI's GLM-4V model."
+)
+if __name__ == "__main__":
+    demo.launch()

requirements.txt ADDED Viewed

	@@ -0,0 +1,5 @@

+gradio
+zhipuai
+pillow
+numpy
+requests