Spaces:

UpCoder
/

stt-uzbek

Runtime error

UpCoder committed on Mar 9

Commit

354dd60

verified ·

1 Parent(s): fbe7334

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -12,6 +12,7 @@ def assess_pronunciation(audio_filepath, target_text):
     if not audio_filepath or not target_text:
         return {"error": "Missing input"}
     try:
         # 1. Transcribe the audio
         result = asr_pipe(audio_filepath)
@@ -19,14 +20,12 @@ def assess_pronunciation(audio_filepath, target_text):
         target_clean = target_text.lower().strip()
         # 2. Calculate Accuracy (String similarity)
-        # This acts as a 'Goodness of Pronunciation' proxy
         accuracy = SequenceMatcher(None, target_clean, student_said).ratio() * 100
         # 3. Calculate Fluency (Words per second)
         audio, sr = librosa.load(audio_filepath)
         duration = librosa.get_duration(y=audio, sr=sr)
         words_count = len(student_said.split())
-        # Heuristic: 120 WPM is native fluency
         fluency = min(100, (words_count / max(duration, 1)) * 40)
         return {
@@ -38,7 +37,7 @@ def assess_pronunciation(audio_filepath, target_text):
     except Exception as e:
         return {"error": str(e)}
-# Interface set to Gradio 3 standards for simple API calls
 interface = gr.Interface(
     fn=assess_pronunciation,
     inputs=[gr.Audio(source="upload", type="filepath"), gr.Textbox(label="Target Text")],

     if not audio_filepath or not target_text:
         return {"error": "Missing input"}
+    # --- MAKE SURE THIS 'TRY' IS NOT INDENTED INSIDE THE 'IF' ABOVE ---
     try:
         # 1. Transcribe the audio
         result = asr_pipe(audio_filepath)
         target_clean = target_text.lower().strip()
         # 2. Calculate Accuracy (String similarity)
         accuracy = SequenceMatcher(None, target_clean, student_said).ratio() * 100
         # 3. Calculate Fluency (Words per second)
         audio, sr = librosa.load(audio_filepath)
         duration = librosa.get_duration(y=audio, sr=sr)
         words_count = len(student_said.split())
         fluency = min(100, (words_count / max(duration, 1)) * 40)
         return {
     except Exception as e:
         return {"error": str(e)}
+# Gradio 3 Interface
 interface = gr.Interface(
     fn=assess_pronunciation,
     inputs=[gr.Audio(source="upload", type="filepath"), gr.Textbox(label="Target Text")],