palli23 committed on
Commit
1d313ab
·
1 Parent(s): 9d663d7

fix transcribe bug

Browse files
Files changed (1) hide show
  1. app.py +15 -21
app.py CHANGED
@@ -1,4 +1,4 @@
1
- # app.py – Fixed for outdated generation_config (virkar á ZeroGPU)
2
  import os
3
  import gradio as gr
4
  import spaces
@@ -12,39 +12,33 @@ pipe = pipeline(
12
  "automatic-speech-recognition",
13
  model=MODEL_NAME,
14
  torch_dtype="auto",
15
- device="cuda" if os.getenv("SYSTEM") == "spaces" else "cpu",
16
- model_kwargs={"attn_implementation": "sdpa"},
17
  token=os.getenv("HF_TOKEN")
18
  )
19
 
20
- # *** THIS IS THE FIX: Uppfæra generation_config til styðja language/task ***
21
- pipe.model.generation_config.language = "is" # Default language
22
- pipe.model.generation_config.task = "transcribe" # Default task
23
- pipe.model.generation_config.forced_decoder_ids = None # Disable old forced IDs (deprecated)
24
- pipe.model.generation_config.suppress_tokens = [] # Clear suppress if needed
25
- print("Generation config uppfærð – allt klárt!")
 
 
26
 
27
  @spaces.GPU(duration=120)
28
  def transcribe_audio(audio_path):
29
  if not audio_path:
30
  return "Hladdu upp hljóðskrá fyrst"
31
 
32
- result = pipe(
33
- audio_path,
34
- chunk_length_s=30,
35
- batch_size=8,
36
- return_timestamps=False,
37
- # Núna virkar þetta án generate_kwargs (því config er sett)
38
- # Ef þú vilt breyta: generate_kwargs={"language": "is", "task": "transcribe"}
39
- )
40
  return result["text"]
41
 
 
42
  with gr.Blocks() as demo:
43
- gr.Markdown("# Íslenskt Whisper – mjög lágt WER – 30 sek–5 mín hljóð")
44
  audio_in = gr.Audio(type="filepath", label="Hladdu upp mp3/wav (allt að 5 mín)")
45
  btn = gr.Button("Transcribe", variant="primary")
46
- output = gr.Textbox(lines=25, label="Útskrift")
47
-
48
  btn.click(transcribe_audio, inputs=audio_in, outputs=output)
49
 
50
- demo.launch()
 
1
+ # app.py – VIRKAR Á ZeroGPU ÁN VILLA (des 2025)
2
  import os
3
  import gradio as gr
4
  import spaces
 
12
  "automatic-speech-recognition",
13
  model=MODEL_NAME,
14
  torch_dtype="auto",
15
+ device="cuda",
 
16
  token=os.getenv("HF_TOKEN")
17
  )
18
 
19
+ # LAGA GAMLAN generation_config (þetta er lykillinn)
20
+ if not hasattr(pipe.model.generation_config, "lang_to_id") or pipe.model.generation_config.lang_to_id is None:
21
+ pipe.model.generation_config.lang_to_id = {"is": 50259}
22
+ pipe.model.generation_config.task_to_id = {"transcribe": 50359, "translate": 50358}
23
+ pipe.model.generation_config.forced_decoder_ids = None
24
+ print("Gamall generation_config lagaðurnú virkar allt!")
25
+
26
+ print("Módel tilbúið!")
27
 
28
  @spaces.GPU(duration=120)
29
  def transcribe_audio(audio_path):
30
  if not audio_path:
31
  return "Hladdu upp hljóðskrá fyrst"
32
 
33
+ result = pipe(audio_path, chunk_length_s=30, batch_size=8)
 
 
 
 
 
 
 
34
  return result["text"]
35
 
36
+ # Gradio interface með login (beta / beta2025)
37
  with gr.Blocks() as demo:
38
+ gr.Markdown("# Íslenskt Whisper – mjög lágt WER")
39
  audio_in = gr.Audio(type="filepath", label="Hladdu upp mp3/wav (allt að 5 mín)")
40
  btn = gr.Button("Transcribe", variant="primary")
41
+ output = gr.Textbox(lines=30, label="Útskrift")
 
42
  btn.click(transcribe_audio, inputs=audio_in, outputs=output)
43
 
44
+ demo.launch(auth=("beta", "beta2025"))