Spaces:

FrederickSundeep
/

ChatMate

Sleeping

App Files Files Community

FrederickSundeep committed on Jun 26, 2025

Commit

cab7f8a

1 Parent(s): 1549b17

update commit with phi-3 mini 1114

Browse files

Files changed (1) hide show

app.py +12 -21

app.py CHANGED Viewed

@@ -1,26 +1,22 @@
 import gradio as gr
-import torch
 from transformers import AutoTokenizer, AutoModelForCausalLM, pipeline
-# ✅ Force ZeroGPU to allocate GPU early
 try:
-    _ = torch.tensor([1.0], device="cuda")
-    print("✅ ZeroGPU triggered successfully.")
-except Exception as e:
-    print(f"⚠️ GPU allocation failed: {e}")
-# 🚀 Load Phi-3 Mini model
 model_id = "microsoft/phi-3-mini-4k-instruct"
 tokenizer = AutoTokenizer.from_pretrained(model_id)
 model = AutoModelForCausalLM.from_pretrained(
-    model_id,
-    torch_dtype=torch.float16 if torch.cuda.is_available() else torch.float32,
-    device_map="auto"
 )
 pipe = pipeline("text-generation", model=model, tokenizer=tokenizer)
-# 💬 Chat function
 def chat_fn(message, history):
     history_text = ""
     for item in history:
@@ -33,18 +29,14 @@ def chat_fn(message, history):
     result = pipe(prompt, max_new_tokens=512, do_sample=True, temperature=0.7)[0]['generated_text']
     reply = result.split("<|assistant|>")[-1].strip()
-    # Format code blocks if applicable
-    if "```" not in reply and any(w in reply for w in ["def ", "class ", "import "]):
         reply = f"```\n{reply}\n```"
     return reply
-# 🧩 Gradio UI
 with gr.Blocks(theme=gr.themes.Soft()) as demo:
     gr.Markdown("## 💬 Chat with Phi-3 Mini")
-    gr.Markdown(
-        "Welcome to your AI Assistant powered by Phi-3 Mini and ZeroGPU (uses GPU if available)."
-    )
     gr.ChatInterface(
         fn=chat_fn,
@@ -57,5 +49,4 @@ with gr.Blocks(theme=gr.themes.Soft()) as demo:
         chatbot=gr.Chatbot(type="messages")
     )
-# 🚀 Launch
-demo.launch(ssr_mode=False)

 import gradio as gr
 from transformers import AutoTokenizer, AutoModelForCausalLM, pipeline
+# ✅ Safe import of the GPU decorator
 try:
+    from spaces import GPU
+except ImportError:
+    def GPU(func): return func  # Fallback if not in a HF Space
+# ✅ Load Phi-3 Mini model
 model_id = "microsoft/phi-3-mini-4k-instruct"
 tokenizer = AutoTokenizer.from_pretrained(model_id)
 model = AutoModelForCausalLM.from_pretrained(
+    model_id, torch_dtype="auto", device_map="auto"
 )
 pipe = pipeline("text-generation", model=model, tokenizer=tokenizer)
+# ✅ Apply GPU decorator to ensure ZeroGPU allocates GPU
+@GPU
 def chat_fn(message, history):
     history_text = ""
     for item in history:
     result = pipe(prompt, max_new_tokens=512, do_sample=True, temperature=0.7)[0]['generated_text']
     reply = result.split("<|assistant|>")[-1].strip()
+    if "```" not in reply and any(word in reply for word in ["def ", "class ", "import "]):
         reply = f"```\n{reply}\n```"
     return reply
+# ✅ Gradio UI
 with gr.Blocks(theme=gr.themes.Soft()) as demo:
     gr.Markdown("## 💬 Chat with Phi-3 Mini")
+    gr.Markdown("Welcome to your AI Assistant powered by Phi-3 Mini. Ask me anything or request code examples!")
     gr.ChatInterface(
         fn=chat_fn,
         chatbot=gr.Chatbot(type="messages")
     )
+demo.launch()