ASR_API2

Sleeping

palli23 committed on Dec 3, 2025

Commit

6161422

1 Parent(s): abc601d

fix transcribe bug

Files changed (2) hide show

app.py CHANGED Viewed

@@ -5,7 +5,7 @@ from transformers import pipeline
 MODEL_NAME = "palli23/whisper-small-sam_spjall"
-print("Hleð módel...")
 pipe = pipeline(
     "automatic-speech-recognition",
@@ -15,25 +15,36 @@ pipe = pipeline(
     token=os.getenv("HF_TOKEN")
 )
-# Fix fyrir gamlar Whisper checkpointar (þarf ennþá)
-if not hasattr(pipe.model.generation_config, "lang_to_id"):
-    pipe.model.generation_config.lang_to_id = {"is": 50259}
-    pipe.model.generation_config.task_to_id = {"transcribe": 50359}
-    pipe.model.generation_config.forced_decoder_ids = None
-print("Módel tilbúið!")
-@spaces.GPU(duration=90)
-def transcribe(audio):
-    if not audio:
-        return "Hladdu upp skrá"
-    return pipe(audio, chunk_length_s=30, batch_size=16)["text"].strip()
-with gr.Blocks() as demo:
-    gr.Markdown("# Íslenskt Whisper – Virkar loksins")
-    inp = gr.Audio(type="filepath", label="Hljóðskrá (allt að 6 mín)")
-    btn = gr.Button("Transcribe", variant="primary")
-    out = gr.Textbox(label="Útskrift", lines=25)
-    btn.click(transcribe, inp, out)
 demo.launch(auth=("beta", "beta2025"))

 MODEL_NAME = "palli23/whisper-small-sam_spjall"
+print("Hleð Whisper small (T4 small – engin takmörk)")
 pipe = pipeline(
     "automatic-speech-recognition",
     token=os.getenv("HF_TOKEN")
 )
+# Þarf ekki lengur að laga gamla config – nýja transformers gerir það sjálft
+print("Módel tilbúið – allt virkar!")
+@spaces.GPU  # engin duration þarf lengur – þú borgar fyrir tímann
+def transcribe(audio_path):
+    if not audio_path:
+        return "Hladdu upp hljóðskrá"
+    result = pipe(audio_path, chunk_length_s=30, batch_size=16)
+    return result["text"].strip()
+with gr.Blocks(theme=gr.themes.Soft()) as demo:
+    gr.Markdown("# Íslenskt Whisper – T4 small (mjög hratt & nákvæmt)")
+    with gr.Row():
+        audio = gr.Audio(
+            label="Hljóðskrá (allt að 15 mín)",
+            type="filepath",
+            waveform=True,           # virkar núna!
+            source="upload"
+        )
+    btn = gr.Button("Transcribe", variant="primary", size="lg")
+    with gr.Row():
+        timer = gr.Timer(label="Tími liðinn", active=True)
+    out = gr.Textbox(label="Útskrift", lines=28, show_copy_button=True)
+    btn.click(transcribe, audio, out).then(
+        lambda: gr.update(active=False), outputs=timer
+    )
 demo.launch(auth=("beta", "beta2025"))

requirements.txt CHANGED Viewed

@@ -1,6 +1,5 @@
-# requirements.txt – ONLY THIS WORKS on ZeroGPU right now
-gradio
-transformers
-spaces
 accelerate
-# DO NOT write any torch version here → ZeroGPU injects its own torch

+gradio>=4.44
+transformers>=4.45
+torch>=2.4
 accelerate
+spaces