oddadmix committed on
Commit
1c40fc0
·
verified ·
1 Parent(s): 629c53a

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +15 -19
app.py CHANGED
@@ -9,25 +9,21 @@ import os
9
  model = None
10
  processor = None
11
 
12
- @spaces.GPU
13
- def load_model():
14
- """Load the model and processor once at startup"""
15
- global model, processor
16
-
17
- print("Loading model...")
18
- model, _ = FastModel.from_pretrained(
19
- model_name = "oddadmix/gemma-4b-egyptian-code-switching-b4-g2",
20
- dtype = None,
21
- max_seq_length = 2048,
22
- load_in_4bit = True, # Enable 4bit for GPU memory efficiency
23
- full_finetuning = False,
24
- )
25
-
26
- processor = Gemma3nProcessor.from_pretrained("google/gemma-3n-E4B-it")
27
-
28
- # Set model to inference mode
29
- FastLanguageModel.for_inference(model)
30
- print("Model loaded successfully!")
31
 
32
  @spaces.GPU
33
  def transcribe_audio(audio_path, max_tokens=128):
 
9
  model = None
10
  processor = None
11
 
12
+ print("Loading model...")
13
+ model, _ = FastModel.from_pretrained(
14
+ model_name = "oddadmix/gemma-4b-egyptian-code-switching-b4-g2",
15
+ dtype = None,
16
+ max_seq_length = 2048,
17
+ load_in_4bit = True, # Enable 4bit for GPU memory efficiency
18
+ full_finetuning = False,
19
+ )
20
+
21
+ processor = Gemma3nProcessor.from_pretrained("google/gemma-3n-E4B-it")
22
+
23
+ # Set model to inference mode
24
+ FastLanguageModel.for_inference(model)
25
+ print("Model loaded successfully!")
26
+
 
 
 
 
27
 
28
  @spaces.GPU
29
  def transcribe_audio(audio_path, max_tokens=128):