ASR_API2 / app.py
palli23's picture
update3
c95f5de
raw
history blame
1.19 kB
# app.py – now runs on ZeroGPU (A100/T4)
import os
import gradio as gr
import spaces # MÁGÍSKUR – virkjar ZeroGPU
from transformers import pipeline
# Hugging Face Hub id of the private ASR model to load.
MODEL_NAME = "palli23/whisper-small-sam_spjall"
# This function runs on the GPU under ZeroGPU.
@spaces.GPU
def transcribe(audio) -> str:
    """Transcribe an uploaded audio file to text.

    Args:
        audio: Path to the audio file to transcribe. Falsy (``None`` or an
            empty string) when nothing has been uploaded.

    Returns:
        The transcribed text, or an Icelandic prompt asking the user to
        upload a file when ``audio`` is falsy.
    """
    if not audio:
        return "Hladdu upp hljóðskrá"

    # NOTE(review): the pipeline is rebuilt on every call, so the model is
    # loaded again for each request. Consider building it once and reusing
    # it -- confirm against the ZeroGPU documentation where model loading
    # is expected to happen.
    pipe = pipeline(
        "automatic-speech-recognition",
        model=MODEL_NAME,
        device=0,  # 0 = first CUDA device
        token=os.getenv("HF_TOKEN"),  # access token for the private model
    )

    # Without chunking the pipeline handles a single window only, so long
    # recordings are not transcribed in full and batch_size has nothing to
    # batch. Splitting into 30-second chunks fixes both.
    result = pipe(audio, chunk_length_s=30, batch_size=8)
    return result["text"]
# Simple interface: one audio input, one button, one transcript box.
with gr.Blocks(title="Íslenskt ASR – ZeroGPU Live") as demo:
    gr.Markdown("# Íslenskt ASR – ZeroGPU (A100/T4)")
    gr.Markdown("**~4 % WER · 0.2× RTF · Keyrir á GPU núna**")
    # type="filepath" hands the callback a path on disk rather than raw samples.
    audio = gr.Audio(type="filepath", label="Hladdu upp .mp3 / .wav")
    btn = gr.Button("Transcribe (15–25 sek)", variant="primary", size="lg")
    out = gr.Textbox(lines=25, label="Útskrift")
    btn.click(transcribe, audio, out)

# Login credentials can be overridden through the environment so real
# secrets do not have to live in source control. The defaults keep the
# previous login working.
# NOTE(review): set ASR_AUTH_USER / ASR_AUTH_PASSWORD in the deployment and
# rotate the default password, since it has been committed to the repository.
demo.launch(
    auth=(
        os.getenv("ASR_AUTH_USER", "beta"),
        os.getenv("ASR_AUTH_PASSWORD", "beta2025"),
    )
)