Spaces:

gaurannggg7
/

Signlink

Running

App Files Community

gaurannggg7 committed 4 days ago

Commit

4f2f9ba

verified ·

1 Parent(s): 2ca0c8e

Update whisper_transcribe.py

Browse files

Files changed (1) hide show

whisper_transcribe.py +1 -77

whisper_transcribe.py CHANGED Viewed

@@ -1,6 +1,4 @@
 import os
-import sounddevice as sd
-import soundfile as sf
 import tempfile
 import whisper
 from utils import get_best_device
@@ -39,78 +37,4 @@ def transcribe_file(path: str, model_name: str = WHISPER_MODEL_NAME) -> str:
         result = model.transcribe(path, fp16=False)
         return result.get("text", "").strip()
     except Exception as e:
-        raise RuntimeError(f"Whisper transcription failed: {e}")
-def list_input_devices():
-    """
-    Return a list of (index, name) for all input-capable audio devices.
-    """
-    devices = sd.query_devices()
-    return [(i, d.get('name', '')) for i, d in enumerate(devices) if d.get('max_input_channels', 0) > 0]
-def record_audio(duration: int, sr: int = 16000, device_index: int = None) -> tuple[int, list[float]]:
-    """
-    Record `duration` seconds of mono audio at sample rate `sr`.
-    Automatically selects a valid input device if none is provided.
-    Raises RuntimeError on failure.
-    """
-    devices = list_input_devices()
-    if not devices:
-        raise RuntimeError("No input audio devices found.")
-    # Choose device: user-specified or default, else first available
-    if device_index is None:
-        default = sd.default.device
-        if isinstance(default, (tuple, list)) and default[0] is not None:
-            device_index = default[0]
-        else:
-            device_index = devices[0][0]
-    # Validate device
-    if device_index not in [i for i, _ in devices]:
-        device_index = devices[0][0]
-    # Configure recorder
-    sd.default.device = (device_index, None)
-    sd.default.samplerate = sr
-    sd.default.channels = 1
-    print(f"Recording {duration}s at {sr}Hz from device #{device_index}…")
-    try:
-        data = sd.rec(int(duration * sr), dtype='float32', channels=1)
-        sd.wait()
-    except Exception as e:
-        raise RuntimeError(f"Audio recording failed: {e}")
-    # Convert to 1D float32 list
-    wav = data.flatten().tolist()
-    return sr, wav
-def transcribe_from_mic(duration: int) -> str:
-    """
-    Record `duration` seconds from the microphone, save to a temp WAV, transcribe, then clean up.
-    Raises RuntimeError on recording or transcription errors.
-    """
-    try:
-        sr, wav = record_audio(duration)
-    except Exception as e:
-        raise RuntimeError(f"Microphone recording error: {e}")
-    # Write to temporary WAV file
-    with tempfile.NamedTemporaryFile(suffix=".wav", delete=False) as tmp:
-        tmp_path = tmp.name
-        sf.write(tmp_path, wav, sr)
-    try:
-        text = transcribe_file(tmp_path)
-    finally:
-        # Ensure cleanup
-        try:
-            os.remove(tmp_path)
-        except OSError:
-            pass
-    return text

 import os
 import tempfile
 import whisper
 from utils import get_best_device
         result = model.transcribe(path, fp16=False)
         return result.get("text", "").strip()
     except Exception as e:
+        raise RuntimeError(f"Whisper transcription failed: {e}")