Spaces:

thava
/

phi3-mini-demo

Sleeping

App Files Files Community

thava commited on Aug 29, 2025

Commit

4df5e6a

1 Parent(s): 17cbe2a

Use pipeline API

Browse files

Files changed (1) hide show

app.v2.py +78 -0

app.v2.py ADDED Viewed

	@@ -0,0 +1,78 @@

+# app.py
+from transformers import pipeline
+import gradio as gr
+# ======================
+# Configuration
+# ======================
+MODEL_ID = "microsoft/Phi-3-mini-128k-instruct"
+# ======================
+# Load Model with pipeline
+# ======================
+print(f"🚀 Loading model: {MODEL_ID}")
+pipe = pipeline(
+    "text-generation",
+    model=MODEL_ID,
+    trust_remote_code=False,
+    torch_dtype="auto",          # Auto-select float16 on GPU
+    device_map="auto",           # Use GPU if available
+    return_full_text=False,      # Only return assistant's reply
+    pad_token_id=198,            # Phi-3: common pad_token_id (for <|endoftext|>)
+)
+print("✅ Pipeline loaded!")
+# ======================
+# Response Function
+# ======================
+def respond(message, history):
+    if not message.strip():
+        return ""
+    # Build conversation using chat template
+    messages = [
+        {"role": "user", "content": msg["content"]}
+        for msg in history
+    ]
+    messages.append({"role": "user", "content": message})
+    # Generate response
+    outputs = pipe(
+        messages,
+        max_new_tokens=1024,
+        temperature=0.7,
+        top_p=0.9,
+        do_sample=True,
+        stop_strings=["<|end|>", "<|endoftext|>"],  # Auto-stopping
+        truncation=True,
+        max_length=128000,
+    )
+    # Extract response text
+    response = outputs[0]["generated_text"] if outputs else ""
+    return response
+# ======================
+# Gradio Interface
+# ======================
+demo = gr.ChatInterface(
+    fn=respond,
+    chatbot=gr.Chatbot(height=600, type="messages"),
+    textbox=gr.Textbox(placeholder="Ask me anything...", container=False, scale=7),
+    title="🧠 Phi-3 Mini (128K) Chat - Simple Pipeline Version",
+    description="A lightweight demo using `transformers.pipeline` for clean, readable code.",
+    examples=[
+        "Who are you?",
+        "Explain quantum computing in simple terms",
+        "Write a Python function to reverse a string"
+    ],
+)
+# ======================
+# Launch
+# ======================
+if __name__ == "__main__":
+    demo.launch()