Spaces:

HexQuant
/

Pars-Medical-o1-Chatbot

Build error

App Files Files Community

HexQuant committed 26 days ago

Commit

c0284f8

verified ·

1 Parent(s): ee072b7

Update app.py

Browse files

Files changed (1) hide show

app.py +44 -92

app.py CHANGED Viewed

@@ -1,149 +1,101 @@
 import gradio as gr
-from llama_cpp import Llama
 import os
-# Download and load model
-print("🔄 Loading model...")
-llm = Llama.from_pretrained(
     repo_id="HexQuant/Pars-Medical-o1-Llama-FFT-GGUF",
     filename="Pars-Medical-o1-Llama-FFT-Q4_K_M.gguf",
     n_ctx=2048,
     n_threads=2,
-    n_gpu_layers=0,  # CPU only for free tier
     verbose=False,
 )
 print("✅ Model loaded!")
-# System prompt
-SYSTEM_PROMPT = """You are Pars-Medical, a bilingual (Persian/English) medical AI assistant with chain-of-thought reasoning.
-When answering:
-1. First, analyze the question in <think> tags
-2. Then provide a clear, helpful answer
-You can respond in both Persian (Farsi) and English based on the user's language.
-⚠️ Important: You are for educational purposes only. Always recommend consulting a real doctor for medical decisions."""
 def respond(message, history):
-    """Generate response for the chatbot"""
-    # Build messages
     messages = [{"role": "system", "content": SYSTEM_PROMPT}]
-    # Add history
     for user_msg, assistant_msg in history:
         messages.append({"role": "user", "content": user_msg})
         if assistant_msg:
             messages.append({"role": "assistant", "content": assistant_msg})
-    # Add current message
     messages.append({"role": "user", "content": message})
-    # Generate response
     response = llm.create_chat_completion(
         messages=messages,
         max_tokens=512,
         temperature=0.7,
-        top_p=0.9,
         stream=True,
     )
-    # Stream response
-    partial_message = ""
     for chunk in response:
-        if "choices" in chunk and len(chunk["choices"]) > 0:
-            delta = chunk["choices"][0].get("delta", {})
-            if "content" in delta:
-                partial_message += delta["content"]
-                yield partial_message
-# Example questions
 EXAMPLES = [
     ["علائم دیابت نوع ۲ چیست؟"],
     ["What are the symptoms of hypothyroidism?"],
-    ["سردرد میگرنی چه تفاوتی با سردرد تنشی دارد؟"],
-    ["How do I differentiate between viral and bacterial infections?"],
-    ["فشار خون بالا چه عوارضی دارد؟"],
-    ["What are the warning signs of a heart attack?"],
 ]
-# Custom CSS
-CSS = """
-.gradio-container {
-    font-family: 'Vazirmatn', 'Segoe UI', sans-serif !important;
-}
-.contain {
-    max-width: 900px !important;
-    margin: auto !important;
-}
-footer {
-    display: none !important;
-}
-"""
-# Build Gradio interface
-with gr.Blocks(css=CSS, title="🩺 Pars-Medical AI") as demo:
     gr.HTML("""
-    <div style="text-align: center; padding: 20px;">
         <h1>🩺 Pars-Medical-o1</h1>
-        <h3>دستیار هوش مصنوعی پزشکی دوزبانه | Bilingual Medical AI Assistant</h3>
-        <p style="color: #666;">
-            <a href="https://huggingface.co/HexQuant/Pars-Medical-o1-Llama-FFT" target="_blank">🤗 Model</a> |
-            <a href="https://twitter.com/xPOURY4" target="_blank">🐦 Twitter</a> |
-            <a href="https://github.com/xPOURY4" target="_blank">💻 GitHub</a>
         </p>
     </div>
     """)
-    chatbot = gr.Chatbot(
-        height=450,
-        placeholder="سوال پزشکی خود را بپرسید... | Ask your medical question...",
-        show_label=False,
-    )
-    msg = gr.Textbox(
-        placeholder="پیام خود را بنویسید... | Type your message...",
-        show_label=False,
-        container=False,
-        scale=7,
-    )
     with gr.Row():
-        submit_btn = gr.Button("ارسال | Send", variant="primary", scale=1)
-        clear_btn = gr.Button("پاک کردن | Clear", scale=1)
-    gr.Examples(
-        examples=EXAMPLES,
-        inputs=msg,
-        label="💡 نمونه سوالات | Example Questions"
-    )
     gr.HTML("""
-    <div style="text-align: center; padding: 15px; margin-top: 20px; background: #fff3cd; border-radius: 10px;">
-        <p style="color: #856404; margin: 0;">
-            ⚠️ <b>توجه:</b> این مدل صرفاً جهت آموزش است و جایگزین مشاوره پزشکی نیست.<br>
-            ⚠️ <b>Disclaimer:</b> This is for educational purposes only. Not a substitute for professional medical advice.
-        </p>
     </div>
     """)
-    gr.HTML("""
-    <div style="text-align: center; padding: 10px; color: #888;">
-        Made with ❤️ by <a href="https://twitter.com/xPOURY4">@xPOURY4</a> in Iran 🇮🇷
-    </div>
-    """)
-    # Event handlers
     msg.submit(respond, [msg, chatbot], chatbot).then(lambda: "", None, msg)
-    submit_btn.click(respond, [msg, chatbot], chatbot).then(lambda: "", None, msg)
-    clear_btn.click(lambda: None, None, chatbot)
-if __name__ == "__main__":
-    demo.queue().launch()

 import gradio as gr
+from huggingface_hub import hf_hub_download
 import os
+# Download model first
+print("📥 Downloading GGUF model...")
+model_path = hf_hub_download(
     repo_id="HexQuant/Pars-Medical-o1-Llama-FFT-GGUF",
     filename="Pars-Medical-o1-Llama-FFT-Q4_K_M.gguf",
+)
+print(f"✅ Model downloaded: {model_path}")
+# Now import and load
+from llama_cpp import Llama
+print("🔄 Loading model...")
+llm = Llama(
+    model_path=model_path,
     n_ctx=2048,
     n_threads=2,
+    n_gpu_layers=0,
     verbose=False,
 )
 print("✅ Model loaded!")
+SYSTEM_PROMPT = """You are Pars-Medical, a bilingual (Persian/English) medical AI assistant.
+When answering medical questions:
+1. Analyze the question carefully
+2. Think step-by-step (you can use <think> tags for reasoning)
+3. Provide accurate, helpful medical information
+You respond in the same language as the user (Persian or English).
+⚠️ Disclaimer: This is for educational purposes only. Always consult a real doctor."""
 def respond(message, history):
+    """Stream the assistant's reply as an updated chat history.
+
+    This function is wired to a gr.Chatbot output, which renders a list of
+    (user, assistant) turns, so each step yields the whole history plus the
+    turn in progress instead of a bare string.
+
+    Args:
+        message: Text the user just submitted.
+        history: Prior turns as (user, assistant) pairs; None is treated
+            as an empty conversation.
+
+    Yields:
+        A list of turns: the prior history followed by
+        [message, reply_generated_so_far].
+    """
+    # Copy so the component's current value is never mutated in place.
+    history = list(history or [])
     messages = [{"role": "system", "content": SYSTEM_PROMPT}]
     for user_msg, assistant_msg in history:
         messages.append({"role": "user", "content": user_msg})
         if assistant_msg:
             messages.append({"role": "assistant", "content": assistant_msg})
     messages.append({"role": "user", "content": message})
     response = llm.create_chat_completion(
         messages=messages,
         max_tokens=512,
         temperature=0.7,
         stream=True,
     )
+    partial = ""
     for chunk in response:
+        # Skip chunks that have no choices or no text content in their delta.
+        choices = chunk.get("choices") or []
+        if not choices:
+            continue
+        token = choices[0].get("delta", {}).get("content")
+        if token:
+            partial += token
+            yield history + [[message, partial]]
 EXAMPLES = [
     ["علائم دیابت نوع ۲ چیست؟"],
     ["What are the symptoms of hypothyroidism?"],
+    ["سردرد میگرنی چه علائمی دارد؟"],
+    ["How to differentiate viral from bacterial infection?"],
 ]
+with gr.Blocks(title="🩺 Pars-Medical-o1") as demo:
     gr.HTML("""
+    <div style="text-align:center; padding:20px;">
         <h1>🩺 Pars-Medical-o1</h1>
+        <p>دستیار پزشکی دوزبانه فارسی-انگلیسی | Bilingual Medical AI</p>
+        <p>
+            <a href="https://huggingface.co/HexQuant/Pars-Medical-o1-Llama-FFT">🤗 Model</a> |
+            <a href="https://twitter.com/xPOURY4">🐦 @xPOURY4</a>
         </p>
     </div>
     """)
+    chatbot = gr.Chatbot(height=400)
+    msg = gr.Textbox(placeholder="سوال پزشکی خود را بپرسید... | Ask your question...", show_label=False)
     with gr.Row():
+        submit = gr.Button("ارسال | Send", variant="primary")
+        clear = gr.Button("پاک کردن | Clear")
+    gr.Examples(examples=EXAMPLES, inputs=msg)
     gr.HTML("""
+    <div style="text-align:center; padding:10px; background:#fff3cd; border-radius:8px; margin-top:15px;">
+        ⚠️ فقط برای آموزش | Educational purposes only - Not medical advice
     </div>
+    <p style="text-align:center; color:#888; margin-top:10px;">Made with ❤️ by @xPOURY4 🇮🇷</p>
     """)
     msg.submit(respond, [msg, chatbot], chatbot).then(lambda: "", None, msg)
+    submit.click(respond, [msg, chatbot], chatbot).then(lambda: "", None, msg)
+    clear.click(lambda: None, None, chatbot)
+demo.queue().launch()