kj03 committed on
Commit
97afa3e
·
verified ·
1 Parent(s): 0999cd0

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +7 -12
app.py CHANGED
@@ -1,23 +1,18 @@
1
  import gradio as gr
2
  from PIL import Image
3
- import torch
4
- from transformers import TrOCRProcessor, VisionEncoderDecoderModel
5
  from gtts import gTTS
 
6
  import tempfile
7
- import os
8
-
9
- # Load TrOCR model (OCR)
10
- processor = TrOCRProcessor.from_pretrained("microsoft/trocr-base-stage1")
11
- ocr_model = VisionEncoderDecoderModel.from_pretrained("microsoft/trocr-base-stage1")
12
 
13
  def bangla_reader(image):
14
  if image is None:
15
  return "কোনো ছবি দেওয়া হয়নি।", None
16
 
17
- # Step 1: OCR
18
- pixel_values = processor(images=image, return_tensors="pt").pixel_values
19
- generated_ids = ocr_model.generate(pixel_values)
20
- ocr_text = processor.batch_decode(generated_ids, skip_special_tokens=True)[0]
 
21
 
22
  # Step 2: gTTS Bangla
23
  try:
@@ -28,7 +23,7 @@ def bangla_reader(image):
28
  except Exception as e:
29
  return f"OCR সফল হয়েছে, কিন্তু TTS ব্যর্থ: {str(e)}", None
30
 
31
- return f"OCR ফলাফল:\n{ocr_text}", audio_path
32
 
33
  # Gradio UI
34
  demo = gr.Interface(
 
1
  import gradio as gr
2
  from PIL import Image
 
 
3
  from gtts import gTTS
4
+ import pytesseract
5
  import tempfile
 
 
 
 
 
6
 
7
  def bangla_reader(image):
8
  if image is None:
9
  return "কোনো ছবি দেওয়া হয়নি।", None
10
 
11
+ # Step 1: OCR using Tesseract (Bangla)
12
+ ocr_text = pytesseract.image_to_string(image, lang='ben')
13
+
14
+ if not ocr_text.strip():
15
+ return "কোনো লেখা সনাক্ত করা যায়নি।", None
16
 
17
  # Step 2: gTTS Bangla
18
  try:
 
23
  except Exception as e:
24
  return f"OCR সফল হয়েছে, কিন্তু TTS ব্যর্থ: {str(e)}", None
25
 
26
+ return f"OCR ফলাফল:\n{ocr_text.strip()}", audio_path
27
 
28
  # Gradio UI
29
  demo = gr.Interface(