Spaces:

Banafo
/

Kroko-Streaming-ASR-Python

Runtime error

Banafo committed on Feb 3, 2025

Commit

669d22d

verified ·

1 Parent(s): 80efd26

Update app.py

Fix for Safari microphone

Files changed (1) hide show

app.py CHANGED Viewed

@@ -83,7 +83,13 @@ def transcribe_audio_online_streaming(file, language):
         while recognizer.is_ready(s):
             recognizer.decode_streams([s])
-        yield recognizer.get_result(s)
     except Exception as e:
         yield f"Error: {e}"
@@ -112,6 +118,8 @@ def transcribe_microphone_stream(audio_chunk, stream_state, language):
             return "", None
         sample_rate, waveform_np = audio_chunk
         # Resample if needed
         if sample_rate != 16000:
@@ -133,6 +141,11 @@ def transcribe_microphone_stream(audio_chunk, stream_state, language):
             recognizer.decode_streams([stream_state])
         current_text = recognizer.get_result(stream_state)
         return current_text, stream_state

         while recognizer.is_ready(s):
             recognizer.decode_streams([s])
+        current_text = recognizer.get_result(s)
+        if isinstance(current_text, (list, np.ndarray)):
+            current_text = " ".join(map(str, current_text))
+        elif isinstance(current_text, bytes):
+            current_text = current_text.decode("utf-8", errors="ignore")
+        yield current_text
     except Exception as e:
         yield f"Error: {e}"
             return "", None
         sample_rate, waveform_np = audio_chunk
+        if len(waveform_np.shape) > 1:
+            waveform_np = waveform_np.mean(axis=1)
         # Resample if needed
         if sample_rate != 16000:
             recognizer.decode_streams([stream_state])
         current_text = recognizer.get_result(stream_state)
+        if isinstance(current_text, (list, np.ndarray)):
+            current_text = " ".join(map(str, current_text))
+        elif isinstance(current_text, bytes):
+            current_text = current_text.decode("utf-8", errors="ignore")
         return current_text, stream_state