Spaces:

FrederickSundeep
/

ChatMate

Sleeping

FrederickSundeep committed on Jun 26, 2025

Commit

2b29a6a

1 Parent(s): 6698e40

update commit with phi-3 mini 5

Files changed (1) hide show

app.py CHANGED Viewed

@@ -1,14 +1,19 @@
 import gradio as gr
 from transformers import AutoTokenizer, AutoModelForCausalLM, pipeline
 # Load Phi-3 Mini model
 model_id = "microsoft/phi-3-mini-4k-instruct"
 tokenizer = AutoTokenizer.from_pretrained(model_id)
 model = AutoModelForCausalLM.from_pretrained(
-    model_id, torch_dtype="auto", device_map="auto"
-)
-pipe = pipeline("text-generation", model=model, tokenizer=tokenizer)
 # OpenAI-style messages (new format)
 def chat_fn(message, history):
@@ -29,11 +34,10 @@ def chat_fn(message, history):
     return reply
 with gr.Blocks(theme=gr.themes.Soft()) as demo:
     gr.Markdown("## 💬 Chat with Phi-3 Mini")
-    gr.Markdown(
-        "Welcome to your AI Assistant powered by Phi-3 Mini. Ask me anything or request code examples!"
-    )
     gr.ChatInterface(
         fn=chat_fn,
@@ -43,7 +47,8 @@ with gr.Blocks(theme=gr.themes.Soft()) as demo:
             "Write a JavaScript function to reverse a string.",
             "Explain how transformers work.",
         ],
-        chatbot=gr.Chatbot(type="messages")  # fixes the deprecated tuples warning
     )
-demo.launch(share=True)

 import gradio as gr
 from transformers import AutoTokenizer, AutoModelForCausalLM, pipeline
+import torch
+# Force device based on availability
+device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
+print(f"Using device: {device}")
 # Load Phi-3 Mini model
 model_id = "microsoft/phi-3-mini-4k-instruct"
 tokenizer = AutoTokenizer.from_pretrained(model_id)
 model = AutoModelForCausalLM.from_pretrained(
+    model_id, torch_dtype=torch.float16 if device.type == "cuda" else torch.float32
+).to(device)
+pipe = pipeline("text-generation", model=model, tokenizer=tokenizer, device=0 if device.type == "cuda" else -1)
 # OpenAI-style messages (new format)
 def chat_fn(message, history):
     return reply
+# Gradio UI
 with gr.Blocks(theme=gr.themes.Soft()) as demo:
     gr.Markdown("## 💬 Chat with Phi-3 Mini")
+    gr.Markdown("Lightweight AI Assistant powered by Microsoft's Phi-3 Mini. Works best with short prompts. Ask away!")
     gr.ChatInterface(
         fn=chat_fn,
             "Write a JavaScript function to reverse a string.",
             "Explain how transformers work.",
         ],
+        chatbot=gr.Chatbot(type="messages")
     )
+# Launch with SSR disabled and without a public share link (for Spaces)
+demo.launch(debug=True, ssr_mode=False)