Spaces:

eoeooe
/

Gooo

Runtime error

File size: 2,115 Bytes

73ce55c
f335c05
73ce55c
 
 
3702ff7
6b549b4
 
 
73ce55c
3702ff7
6b549b4
 
 
 
 
 
 
73ce55c
6b549b4
73ce55c
 
 
 
6b549b4
 
73ce55c
 
6b549b4
73ce55c
 
 
 
1ee2fbb
 
 
 
73ce55c
1c78297
6b549b4
1c78297
73ce55c
6b549b4
73ce55c
6b549b4
 
3fe8c41
 
48f6c81

import pytesseract
from PIL import Image
import gradio as gr
from transformers import AutoTokenizer, AutoModelForSequenceClassification
import torch

# ✅ โมเดลนี้โหลดได้จริง + พร้อมใช้งาน
model_name = "thainlp/bert-base-thai-snips"
tokenizer = AutoTokenizer.from_pretrained(model_name)
model = AutoModelForSequenceClassification.from_pretrained(model_name)

# Label map จากโมเดล (SNIPS dataset มี intent เช่น สั่งอาหาร, ตรวจอากาศ)
labels = [
    "AddToPlaylist", "BookRestaurant", "GetWeather",
    "PlayMusic", "RateBook", "SearchCreativeWork",
    "SearchScreeningEvent"
]

def ocr_and_classify(image):
    # OCR อ่านข้อความไทย + อังกฤษ
    text = pytesseract.image_to_string(image, lang="tha+eng")
    
    if not text.strip():
        return "❌ ไม่พบข้อความในภาพ"

    # วิเคราะห์ข้อความด้วย BERT
    inputs = tokenizer(text, return_tensors="pt", truncation=True, padding=True)
    outputs = model(**inputs)

    probs = torch.nn.functional.softmax(outputs.logits, dim=-1)
    pred_class_idx = torch.argmax(probs).item()
    confidence = probs[0][pred_class_idx].item()

    result = (
        f"📄 ข้อความที่อ่านได้:\n{text}\n\n"
        f"📝 การจำแนกข้อความ:\n{labels[pred_class_idx]} (ความมั่นใจ {confidence:.2%})"
    )
    return result

# Gradio UI
iface = gr.Interface(
    fn=ocr_and_classify,
    inputs=gr.Image(type="pil", label="อัปโหลดภาพ"),
    outputs=gr.Textbox(lines=15, label="ผลลัพธ์"),
    title="OCR + วิเคราะห์ข้อความด้วย BERT (Thai)",
    description="อ่านข้อความจากภาพด้วย pytesseract แล้ววิเคราะห์ด้วย BERT ที่รองรับภาษาไทย"
)

if __name__ == "__main__":
    iface.launch()