Spaces:

Lesterchia1
/

FPOC2_AI-Tutor_Chatbot

Running

Chia Woon Yap committed on Oct 1, 2025

Commit

15bfc80

verified ·

1 Parent(s): a712245

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -264,13 +264,41 @@ def process_document(file):
         return f"Error processing document: {str(e)}"
 # Function to handle speech-to-text conversion
 def transcribe_audio(audio):
     sr, y = audio
     if y.ndim > 1:
         y = y.mean(axis=1)
     y = y.astype(np.float32)
-    y /= np.max(np.abs(y))
-    return transcriber({"sampling_rate": sr, "raw": y})["text"]
 # Clear chat history function
 def clear_chat_history():

         return f"Error processing document: {str(e)}"
 # Function to handle speech-to-text conversion
+#def transcribe_audio(audio):
+#    sr, y = audio
+#    if y.ndim > 1:
+#        y = y.mean(axis=1)
+#    y = y.astype(np.float32)
+#    y /= np.max(np.abs(y))
+#    return transcriber({"sampling_rate": sr, "raw": y})["text"]
+#Quick Fixes You Can Try First:
 def transcribe_audio(audio):
     sr, y = audio
     if y.ndim > 1:
         y = y.mean(axis=1)
     y = y.astype(np.float32)
+    # Improved normalization
+    max_val = np.max(np.abs(y))
+    if max_val > 0:
+        y /= max_val
+    # Use better model
+    better_transcriber = pipeline(
+        "automatic-speech-recognition",
+        model="openai/whisper-small.en",  # More accurate
+        chunk_length_s=30
+    )
+    return better_transcriber({"sampling_rate": sr, "raw": y})["text"]
+# the remaining is the same
 # Clear chat history function
 def clear_chat_history():