Spaces:
Sleeping
Update app.py
Browse files
app.py
CHANGED
|
@@ -21,9 +21,9 @@ def bangla_reader(image):
|
|
| 21 |
generated_ids = model.generate(pixel_values)
|
| 22 |
ocr_text = processor.batch_decode(generated_ids, skip_special_tokens=True)[0]
|
| 23 |
|
| 24 |
-
# TTS
|
| 25 |
with tempfile.NamedTemporaryFile(suffix=".wav", delete=False) as tmp:
|
| 26 |
-
tts.tts_to_file(text=ocr_text, file_path=tmp.name, language="bn"
|
| 27 |
audio_path = tmp.name
|
| 28 |
|
| 29 |
return f"OCR ফলাফল: {ocr_text}", audio_path
|
|
|
|
| 21 |
generated_ids = model.generate(pixel_values)
|
| 22 |
ocr_text = processor.batch_decode(generated_ids, skip_special_tokens=True)[0]
|
| 23 |
|
| 24 |
+
# TTS (without speaker argument)
|
| 25 |
with tempfile.NamedTemporaryFile(suffix=".wav", delete=False) as tmp:
|
| 26 |
+
tts.tts_to_file(text=ocr_text, file_path=tmp.name, language="bn") # Removed speaker
|
| 27 |
audio_path = tmp.name
|
| 28 |
|
| 29 |
return f"OCR ফলাফল: {ocr_text}", audio_path
|