Spaces:

shuarya2011
/

Assistant

Running

shuarya2011 committed 18 days ago

Commit

b3e26e8

verified ·

1 Parent(s): 46c3885

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -21,10 +21,22 @@ MODEL_ID = "google/gemma-4-31B-it-assistant"
 print("Loading tokenizer...")
 tokenizer = AutoTokenizer.from_pretrained(MODEL_ID)
 print("Loading model...")
 model = AutoModelForCausalLM.from_pretrained(
     MODEL_ID,
-    torch_dtype=torch.bfloat16,
     device_map="auto",
 )
 model.eval()
@@ -73,11 +85,6 @@ demo = gr.ChatInterface(
     fn=chat,
     title="Gemma 4 Assistant",
     description="google/gemma-4-31B-it-assistant — streaming enabled",
-    examples=[
-        "Explain quantum computing in simple terms",
-        "Write a Python function to reverse a string",
-        "What is photosynthesis?",
-    ],
 )
 demo.launch()

 print("Loading tokenizer...")
 tokenizer = AutoTokenizer.from_pretrained(MODEL_ID)
+# Manually set Gemma chat template since tokenizer doesn't include one
+tokenizer.chat_template = (
+    "{% for message in messages %}"
+    "{% if message['role'] == 'user' %}"
+    "user\n{{ message['content'] }}\n"
+    "{% elif message['role'] == 'assistant' %}"
+    "model\n{{ message['content'] }}\n"
+    "{% endif %}"
+    "{% endfor %}"
+    "{% if add_generation_prompt %}model\n{% endif %}"
+)
 print("Loading model...")
 model = AutoModelForCausalLM.from_pretrained(
     MODEL_ID,
+    dtype=torch.bfloat16,
     device_map="auto",
 )
 model.eval()
     fn=chat,
     title="Gemma 4 Assistant",
     description="google/gemma-4-31B-it-assistant — streaming enabled",
 )
 demo.launch()