Spaces:

FrederickSundeep
/

ChatMate

Sleeping

FrederickSundeep committed on Jun 26, 2025

Commit

daf4465

1 Parent(s): fefedde

update commit with phi-3 mini 2

Files changed (1) hide show

app.py CHANGED Viewed

@@ -5,7 +5,9 @@ from transformers import AutoTokenizer, AutoModelForCausalLM, pipeline
 model_id = "microsoft/phi-3-mini-4k-instruct"
 tokenizer = AutoTokenizer.from_pretrained(model_id)
 model = AutoModelForCausalLM.from_pretrained(
-    model_id, torch_dtype="auto", device_map="auto"
 )
 pipe = pipeline("text-generation", model=model, tokenizer=tokenizer)
@@ -18,20 +20,29 @@ def chat_fn(message, history):
     prompt = f"{history_text}<|user|>\n{message}\n<|assistant|>\n"
     response = pipe(prompt, max_new_tokens=512, do_sample=True, temperature=0.7)[0]['generated_text']
     reply = response.split("<|assistant|>")[-1].strip()
     return reply
-# Wrap with Blocks for custom layout and auth
 with gr.Blocks(theme=gr.themes.Soft()) as demo:
     gr.Markdown("## 💬 Chat with Phi-3 Mini")
-    gr.Markdown("Welcome! Lightweight, fast, and privacy-focused AI assistant powered by Microsoft's Phi-3. You can ask questions, request code, or chat naturally.")
-    gr.ChatInterface(fn=chat_fn,
-                     examples=["What is a large language model?", "Write a Python function to reverse a list.", "Explain the concept of recursion."],
-                     title="",
-                     retry_btn="↻ Retry",
-                     undo_btn="⤺ Undo",
-                     clear_btn="🧹 Clear"
-                     )
-# Add authentication here
 demo.launch(auth=("user", "pass"))

 model_id = "microsoft/phi-3-mini-4k-instruct"
 tokenizer = AutoTokenizer.from_pretrained(model_id)
 model = AutoModelForCausalLM.from_pretrained(
+    model_id,
+    torch_dtype="auto",
+    device_map="auto"  # Will default to CPU if no GPU available
 )
 pipe = pipeline("text-generation", model=model, tokenizer=tokenizer)
     prompt = f"{history_text}<|user|>\n{message}\n<|assistant|>\n"
     response = pipe(prompt, max_new_tokens=512, do_sample=True, temperature=0.7)[0]['generated_text']
     reply = response.split("<|assistant|>")[-1].strip()
+    # Format as Markdown code block if reply looks like code
+    if "```" not in reply and any(keyword in reply for keyword in ["def ", "class ", "import ", ";", "{", "}"]):
+        reply = f"```\n{reply}\n```"
     return reply
+# Launch the app with basic Blocks + authentication
 with gr.Blocks(theme=gr.themes.Soft()) as demo:
     gr.Markdown("## 💬 Chat with Phi-3 Mini")
+    gr.Markdown(
+        "Welcome! A lightweight, privacy-friendly AI assistant powered by Microsoft's Phi-3 Mini.\n"
+        "Ask any question or request code examples. Use your credentials to access this demo."
+    )
+    gr.ChatInterface(
+        fn=chat_fn,
+        examples=[
+            "What is a large language model?",
+            "Write a Python function to reverse a list.",
+            "Explain the concept of recursion."
+        ],
+        title="",
+    )
 demo.launch(auth=("user", "pass"))