| | import gradio as gr |
| | import requests |
| |
|
# HTTP endpoint on localhost that every prompt is POSTed to.
API_URL = "http://localhost:7860/completion"

# Persona preamble placed at the very start of each prompt.
SYSTEM_PROMPT = (
    "You are Roy – an AI assistant created and fine-tuned by Souvik Pramanick.\n"
    "Be friendly, concise and helpful. Never mention internal tokens like [/INST]."
)
| |
|
def _history_lines(history):
    """Render earlier turns as ``User:`` / ``Roy:`` transcript lines.

    Accepts either history shape a chat UI may hand over:

    * pair style: an iterable of ``(user_text, bot_text)`` pairs;
    * message style: an iterable of dicts with ``"role"`` and ``"content"``
      keys, where the role is ``"user"`` or ``"assistant"``.

    Message-style entries with an unknown role or non-text content are
    skipped, since they cannot be expressed in the plain-text transcript.

    Args:
        history: Previous conversation turns, or ``None``/empty.

    Returns:
        A list of newline-terminated transcript fragments, oldest first.
    """
    speaker_for_role = {"user": "User", "assistant": "Roy"}
    lines = []
    for turn in history or ():
        if isinstance(turn, dict):
            speaker = speaker_for_role.get(turn.get("role"))
            content = turn.get("content")
            if speaker is not None and isinstance(content, str):
                lines.append(f"{speaker}: {content}\n")
        else:
            user, bot = turn
            lines.append(f"User: {user}\nRoy: {bot}\n")
    return lines


def chat(message, history):
    """Generate Roy's reply to ``message`` given the prior conversation.

    Builds a plain-text prompt (system prompt, transcript of ``history``,
    then the new user message followed by an open ``Roy:`` line), POSTs it
    to ``API_URL`` and returns the ``"content"`` field of the JSON response
    with any ``[/INST]`` marker removed and surrounding whitespace stripped.

    Args:
        message: The new user message.
        history: Earlier turns, as ``(user, bot)`` pairs or as
            role/content dicts.

    Returns:
        The cleaned reply text, or a fixed "backend busy" notice when the
        request fails, the server answers with an HTTP error status, or the
        response body is not a JSON object.
    """
    busy_notice = "⚠ Backend busy – please wait a few seconds and try again."

    prompt = "".join(
        [
            SYSTEM_PROMPT,
            "\n\n",
            *_history_lines(history),
            f"User: {message}\nRoy:",
        ]
    )

    payload = {
        "prompt": prompt,
        "n_predict": 120,
        "temperature": 0.7,
        # Stop before the model starts writing the next user turn itself.
        "stop": ["User:"],
    }

    try:
        response = requests.post(API_URL, json=payload, timeout=300)
        # Without this, an error response carrying a JSON body would be
        # treated as a successful (empty) completion.
        response.raise_for_status()
        data = response.json()
    except (requests.RequestException, ValueError):
        # Transport failure, timeout, HTTP error status, or undecodable body.
        return busy_notice

    if not isinstance(data, dict):
        return busy_notice

    text = data.get("content", "")
    if not isinstance(text, str):
        text = ""

    # The model occasionally leaks its instruction-template marker.
    return text.replace("[/INST]", "").strip()
| |
|
| |
|
# Starter prompts offered as clickable examples in the chat UI.
_EXAMPLE_PROMPTS = [
    "Who created you?",
    "Explain AI in 3 lines",
    "Give Python roadmap",
]

# Chat front-end: every submitted message is answered by chat().
demo = gr.ChatInterface(
    fn=chat,
    title="Roy AI",
    description="Personal AI created by Souvik Pramanick",
    examples=_EXAMPLE_PROMPTS,
)

# Listen on all interfaces on port 7861.
demo.launch(
    server_name="0.0.0.0",
    server_port=7861,
)
| |
|