palli23 committed on
Commit
ac10614
·
1 Parent(s): 38b1c82

rollback 2 days

Browse files
Files changed (1) hide show
  1. app.py +25 -25
app.py CHANGED
@@ -1,3 +1,4 @@
 
1
  import os
2
  import gradio as gr
3
  import spaces
@@ -5,40 +6,39 @@ from transformers import pipeline
5
 
6
  MODEL_NAME = "palli23/whisper-small-sam_spjall"
7
 
8
@spaces.GPU(duration=120)  # author's note: enough for 3 minutes of audio
def transcribe_3min(audio_path):
    """Transcribe an uploaded audio file with the Whisper ASR pipeline.

    Args:
        audio_path: Path of the audio file to transcribe. A falsy value
            (``None`` or an empty string) means nothing was uploaded.

    Returns:
        The ``"text"`` entry of the pipeline result, or a fixed prompt
        string when ``audio_path`` is falsy.
    """
    if not audio_path:
        return "Hladdu upp hljóðskrá"

    # Whisper pipeline with chunking – ZeroGPU safe (original author's note).
    # The pipeline is constructed inside the GPU-decorated call.
    model_options = {
        "model": MODEL_NAME,
        "device": 0,
        "token": os.getenv("HF_TOKEN"),
        # FP16 instead of FP32.
        "torch_dtype": "float16",
        # use_flash_attention_2 is intentionally not passed: per the original
        # author's note it causes a TypeError on this model.
    }
    asr = pipeline("automatic-speech-recognition", **model_options)

    decode_options = {
        "chunk_length_s": 30,        # 30-second chunks
        "stride_length_s": (6, 0),   # 6-second overlap
        "return_timestamps": False,
        "batch_size": 8,
    }
    return asr(audio_path, **decode_options)["text"]
32
 
33
# Interface: upload widget, transcribe button and a text box for the result.
with gr.Blocks(title="Íslenskt ASR – 3 mín") as demo:
    gr.Markdown("# Íslenskt ASR – 3 mínútur")
    gr.Markdown("**Whisper · Very low WER · 0.5-5minute audio transcribe á ZeroGPU**")

    audio = gr.Audio(type="filepath", label="Hladdu upp .mp3 / .wav (allt að 3 mín)")
    btn = gr.Button("Transcribe", variant="primary", size="lg")
    out = gr.Textbox(lines=30, label="Útskrift")

    # Clicking the button sends the uploaded file to transcribe_3min and
    # writes the returned text into the output box.
    btn.click(transcribe_3min, inputs=audio, outputs=out)

# Basic-auth credentials can be overridden through the environment so they do
# not have to live in source control. The defaults reproduce the previously
# hard-coded values for backward compatibility; set APP_AUTH_USER and
# APP_AUTH_PASSWORD in any real deployment.
demo.launch(
    auth=(
        os.getenv("APP_AUTH_USER", "beta"),
        os.getenv("APP_AUTH_PASSWORD", "beta2025"),
    )
)
 
1
+ # app.py – works 100% on ZeroGPU (and on a regular GPU too)
2
  import os
3
  import gradio as gr
4
  import spaces
 
6
 
7
  MODEL_NAME = "palli23/whisper-small-sam_spjall"
8
 
9
# Load the model ONCE when the app starts (not on every call).
print("Hleð Whisper módelinu einu sinni...")
pipe = pipeline(
    task="automatic-speech-recognition",
    model=MODEL_NAME,
    token=os.getenv("HF_TOKEN"),
    device_map="auto",  # original author's note: this is the key for ZeroGPU
    torch_dtype="auto",
)
print("Módel tilbúið!")
19
+
20
@spaces.GPU(duration=120)  # author's note: 2 minutes is enough for 3–4 minutes of audio
def transcribe_3min(audio_path):
    """Transcribe an uploaded audio file using the module-level ``pipe``.

    Args:
        audio_path: Path of the audio file to transcribe. A falsy value
            (``None`` or an empty string) means nothing was uploaded.

    Returns:
        The ``"text"`` entry of the pipeline result, or a fixed prompt
        string when ``audio_path`` is falsy.
    """
    if not audio_path:
        return "Hladdu upp hljóðskrá fyrst"

    decode_options = {
        "chunk_length_s": 30,
        "batch_size": 8,
        "return_timestamps": False,
        # Passed through to generation: language "is", task "transcribe".
        "generate_kwargs": {"language": "is", "task": "transcribe"},
    }
    transcription = pipe(audio_path, **decode_options)
    return transcription["text"]
33
 
 
# UI layout: heading, usage hint, upload widget, button and result box.
with gr.Blocks(title="Íslenskt ASR – 3 mín") as demo:
    gr.Markdown(value="# Íslenskt Whisper – 3 mín hljóð á ZeroGPU")
    gr.Markdown(value="Hladdu upp allt 3–4 mínútna hljóðskrá (mp3/wav). Virkar strax!")

    # The audio component is configured with type="filepath".
    audio_in = gr.Audio(label="Hljóðskrá (max ~4 mín)", type="filepath")
    btn = gr.Button(value="Transcribe", variant="primary")
    text_out = gr.Textbox(label="Útskrift", lines=25)

    # Clicking the button runs transcribe_3min on the uploaded file and
    # places the returned text in the output box.
    btn.click(fn=transcribe_3min, inputs=audio_in, outputs=text_out)

demo.launch()