captchabreaker

Runtime error

App Files Files Community

golyew committed on Sep 9, 2025

Commit

faca012

verified ·

1 Parent(s): 31b5da1

Update app.py

Browse files

Files changed (1) hide show

app.py +22 -14

app.py CHANGED Viewed

@@ -4,25 +4,33 @@ from PIL import Image
 import numpy as np
 from tokenizer_base import Tokenizer
 import gradio as gr
-from huggingface_hub import Repository
 # Параметры модели
 model_file = "captcha.onnx"
-img_size = (32,128)
 charset = r"0123456789abcdefghijklmnopqrstuvwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ!\"#$%&'()*+,-./:;<=>?@[\\]^_`{|}~"
 tokenizer_base = Tokenizer(charset)
-# Преобразования изображения (замена torchvision)
 def preprocess_image(img, img_size):
-    # resize с bicubic
     img = img.resize(img_size, Image.BICUBIC)
-    # в numpy (HWC → CHW)
     img = np.array(img).astype(np.float32) / 255.0
-    img = np.transpose(img, (2, 0, 1))  # (H,W,C) → (C,H,W)
-    # нормализация (x-mean)/std, тут mean=0.5, std=0.5
     img = (img - 0.5) / 0.5
-    # добавляем batch dim
     img = np.expand_dims(img, axis=0)
     return img
 # softmax на numpy
@@ -37,22 +45,22 @@ def initialize_model(model_file):
     ort_session = rt.InferenceSession(model_file)
     return ort_session
-# Функция для распознавания текста на изображении
 def get_text(img_org):
-    x = preprocess_image(img_org.convert('RGB'), img_size)
     # Предсказание с помощью ONNX
     ort_inputs = {ort_session.get_inputs()[0].name: x}
     logits = ort_session.run(None, ort_inputs)[0]
-    probs = softmax(logits, axis=-1)  # Вычисляем вероятности
-    preds, probs = tokenizer_base.decode(probs)  # Декодируем результат
-    return preds[0]  # Берём первое предсказание
 # Инициализация модели
 ort_session = initialize_model(model_file=model_file)
-# Создание Gradio интерфейса
 def gradio_interface():
     return gr.Interface(
         fn=get_text,

 import numpy as np
 from tokenizer_base import Tokenizer
 import gradio as gr
 # Параметры модели
 model_file = "captcha.onnx"
+img_size = (32, 128)
 charset = r"0123456789abcdefghijklmnopqrstuvwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ!\"#$%&'()*+,-./:;<=>?@[\\]^_`{|}~"
 tokenizer_base = Tokenizer(charset)
+# Надёжный препроцессинг
 def preprocess_image(img, img_size):
+    # Приводим к RGB (убираем альфу/градации серого)
+    img = img.convert("RGB")
+    # Resize bicubic
     img = img.resize(img_size, Image.BICUBIC)
+    # В numpy (HWC → float32)
     img = np.array(img).astype(np.float32) / 255.0
+    # HWC → CHW
+    img = np.transpose(img, (2, 0, 1))
+    # Нормализация (x-mean)/std
     img = (img - 0.5) / 0.5
+    # Добавляем batch размерность
     img = np.expand_dims(img, axis=0)
     return img
 # softmax на numpy
     ort_session = rt.InferenceSession(model_file)
     return ort_session
+# Функция для распознавания текста
 def get_text(img_org):
+    x = preprocess_image(img_org, img_size)
     # Предсказание с помощью ONNX
     ort_inputs = {ort_session.get_inputs()[0].name: x}
     logits = ort_session.run(None, ort_inputs)[0]
+    probs = softmax(logits, axis=-1)
+    preds, probs = tokenizer_base.decode(probs)
+    return preds[0]
 # Инициализация модели
 ort_session = initialize_model(model_file=model_file)
+# Gradio интерфейс
 def gradio_interface():
     return gr.Interface(
         fn=get_text,