Spaces:

mkfallah
/

pasr

Sleeping

mkfallah committed on Sep 4, 2025

Commit

1e401c5

verified ·

1 Parent(s): 7a6ef6c

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -1,8 +1,6 @@
 import gradio as gr
 from transformers import pipeline
 from rapidfuzz import process, fuzz
-import soundfile as sf
-import numpy as np
 # Initialize ASR pipeline
 asr = pipeline(
@@ -22,7 +20,6 @@ custom_vocab_map = {
 def replace_fuzzy(text, vocab_map, threshold=85):
     """
     Replace words/phrases in text using fuzzy matching with high threshold.
-    Supports multiple alternatives per word/phrase.
     """
     for target, alternatives in vocab_map.items():
         result = process.extractOne(text, alternatives, scorer=fuzz.partial_ratio)
@@ -39,12 +36,13 @@ def replace_fuzzy(text, vocab_map, threshold=85):
 def transcribe(audio_file):
     """
-    Handle audio input from Gradio (filepath from mic or upload).
     """
-    if audio_file is None:
         return "No audio input detected."
     try:
         result = asr(audio_file, chunk_length_s=30, stride_length_s=[5,5])
     except Exception as e:
         return f"ASR error: {e}"
@@ -59,8 +57,8 @@ iface = gr.Interface(
     inputs=gr.Audio(type="filepath", label="Record or upload audio"),
     outputs="text",
     title="Persian ASR with High Accuracy Vocabulary",
-    description="""Speak in Persian or upload an audio file;
-recognized words are corrected using a custom high-accuracy vocabulary."""
 )
 if __name__ == "__main__":

 import gradio as gr
 from transformers import pipeline
 from rapidfuzz import process, fuzz
 # Initialize ASR pipeline
 asr = pipeline(
 def replace_fuzzy(text, vocab_map, threshold=85):
     """
     Replace words/phrases in text using fuzzy matching with high threshold.
     """
     for target, alternatives in vocab_map.items():
         result = process.extractOne(text, alternatives, scorer=fuzz.partial_ratio)
 def transcribe(audio_file):
     """
+    audio_file: path to WAV file (Gradio mic or upload)
     """
+    if not audio_file:
         return "No audio input detected."
     try:
+        # Run ASR
         result = asr(audio_file, chunk_length_s=30, stride_length_s=[5,5])
     except Exception as e:
         return f"ASR error: {e}"
     inputs=gr.Audio(type="filepath", label="Record or upload audio"),
     outputs="text",
     title="Persian ASR with High Accuracy Vocabulary",
+    description="""Speak in Persian or upload an audio file; recognized words
+are corrected using a custom high-accuracy vocabulary."""
 )
 if __name__ == "__main__":