palli23 committed on
Commit
5f7601c
·
verified ·
1 Parent(s): a4070be

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +11 -23
app.py CHANGED
@@ -1,4 +1,4 @@
1
- # app.py — Your original working version + repetition_penalty=1.2 + ngram=3
2
 
3
  import os
4
  os.environ["OMP_NUM_THREADS"] = "1"
@@ -19,31 +19,19 @@ def transcribe_3min(audio_path):
19
  return "Hlaðið upp hljóðskrá"
20
 
21
  pipe = pipeline(
22
- "automatic-speech-recognition",
23
- #model="palli23/whisper-tiny-icelandic-distilled-v3",
24
- #model = "palli23/whisper-tiny-distilled-spjallromur-polish-v3",
25
- #odel = "palli23/whisper-tiny-distilled-spjallromur-polish-v5",
26
- #model="palli23/whisper-tiny-distilled-samromur-spjallromur-polish",
27
- #model="palli23/whisper-tiny-samromur-spjallromur",
28
- model="palli23/whisper-small-sam_spjall",
29
- torch_dtype=torch.float16,
30
- device=0, # GPU inside @spaces.GPU
31
  )
32
 
33
  result = pipe(
34
  audio_path,
35
- chunk_length_s=30,
36
- batch_size=8,
37
- return_timestamps=False, # ← no timestamps, as you want
38
- generate_kwargs={
39
- "num_beams": 5, #var beam size 1
40
- "repetition_penalty": 1.2, # ← exactly what you asked for
41
- "no_repeat_ngram_size": 3, # ← exactly what you asked for
42
- "temperature": 0.0,
43
- }
44
  )
45
 
46
- # Clean memory so ZeroGPU lives forever
47
  del pipe
48
  gc.collect()
49
  torch.cuda.empty_cache()
@@ -54,8 +42,8 @@ def transcribe_3min(audio_path):
54
  # UI – clean and simple
55
  # ——————————————————————————————
56
  with gr.Blocks() as demo:
57
- gr.Markdown("# Íslenskt ASR – 3 mínútur")
58
- gr.Markdown("**palli23/whisper-small-sam_spjall** · mjög lágur WER · allt að 5 mín hljóð")
59
  gr.Markdown("**Hafa samband:** pallinr1@protonmail.com")
60
 
61
  audio_in = gr.Audio(type="filepath", label="Hlaðið upp .mp3 / .wav")
@@ -72,4 +60,4 @@ demo.launch(
72
  server_name="0.0.0.0",
73
  server_port=7860,
74
  auth=None
75
- )
 
1
+ # app.py — wav2vec2 CTC ASR (ZeroGPU safe)
2
 
3
  import os
4
  os.environ["OMP_NUM_THREADS"] = "1"
 
19
  return "Hlaðið upp hljóðskrá"
20
 
21
  pipe = pipeline(
22
+ task="automatic-speech-recognition",
23
+ model="palli23/wav2vec2-xlsr-300m-icelandic",
24
+ # model="palli23/wav2vec2-icelandic-multi-aug-v2-5e-6", # ← alt model (commented)
25
+ torch_dtype=torch.float32, # wav2vec2 requires fp32
26
+ device=0,
 
 
 
 
27
  )
28
 
29
  result = pipe(
30
  audio_path,
31
+ chunk_length_s=20, # safe chunking for wav2vec2
 
 
 
 
 
 
 
 
32
  )
33
 
34
+ # Clean memory so ZeroGPU survives
35
  del pipe
36
  gc.collect()
37
  torch.cuda.empty_cache()
 
42
  # UI – clean and simple
43
  # ——————————————————————————————
44
  with gr.Blocks() as demo:
45
+ gr.Markdown("# Íslenskt ASR – wav2vec2")
46
+ gr.Markdown("**palli23/wav2vec2-xlsr-300m-icelandic** · CTC · mjög hraðvirkt")
47
  gr.Markdown("**Hafa samband:** pallinr1@protonmail.com")
48
 
49
  audio_in = gr.Audio(type="filepath", label="Hlaðið upp .mp3 / .wav")
 
60
  server_name="0.0.0.0",
61
  server_port=7860,
62
  auth=None
63
+ )