Spaces:

raksama19
/

Test-Voice-Chatbot

Sleeping

raksama19 committed on Jul 18, 2025

Commit

6ed2a3f

verified ·

1 Parent(s): 2160785

Update gemma_inference.py

Files changed (1) hide show

gemma_inference.py CHANGED Viewed

@@ -9,6 +9,7 @@ from typing import Generator, Optional
 import numpy as np
 from utils.snac_utils import generate_audio_data, get_snac
 from utils.vad import get_speech_timestamps, collect_chunks
 class GemmaOmniInference:
     """
@@ -20,15 +21,24 @@ class GemmaOmniInference:
         self.device = device
         self.model_id = model_id
         # Initialize models
         print("Loading Gemma 3n model...")
         self.model = Gemma3nForConditionalGeneration.from_pretrained(
             model_id,
             device_map="auto",
-            torch_dtype=torch.bfloat16
         ).eval()
-        self.processor = AutoProcessor.from_pretrained(model_id)
         # Keep the audio processing models
         print("Loading audio processing models...")

 import numpy as np
 from utils.snac_utils import generate_audio_data, get_snac
 from utils.vad import get_speech_timestamps, collect_chunks
+from huggingface_hub import login
 class GemmaOmniInference:
     """
         self.device = device
         self.model_id = model_id
+        # Authenticate with Hugging Face
+        hf_token = os.getenv("HF_TOKEN")
+        if hf_token:
+            print("Authenticating with Hugging Face...")
+            login(token=hf_token)
+        else:
+            print("Warning: HF_TOKEN not found. Make sure to set it in Space secrets.")
         # Initialize models
         print("Loading Gemma 3n model...")
         self.model = Gemma3nForConditionalGeneration.from_pretrained(
             model_id,
             device_map="auto",
+            torch_dtype=torch.bfloat16,
+            token=hf_token
         ).eval()
+        self.processor = AutoProcessor.from_pretrained(model_id, token=hf_token)
         # Keep the audio processing models
         print("Loading audio processing models...")