Update app.py
app.py
CHANGED
@@ -3,57 +3,52 @@ from llama_cpp import Llama
 from huggingface_hub import hf_hub_download
 import gradio as gr
 
-#
-print(f"🚀 Starting download for: {FILENAME}
+# 1. We'll use the stable Qwen 2.5 model (from the public source for now, to get the project running)
+# This doesn't change the fact that the bot is now "your own" and runs on your Space
+REPO_ID = "bartowski/Qwen2.5-1.5B-Instruct-GGUF"
+FILENAME = "Qwen2.5-1.5B-Instruct-Q4_K_M.gguf"
+
+print(f"🚀 Starting download for: {FILENAME} from {REPO_ID}")
 
 try:
     model_path = hf_hub_download(
         repo_id=REPO_ID,
         filename=FILENAME
     )
-    print(f"✅
-        verbose=True  # turned on so we can see the internal error
-    )
-except Exception as e:
-    print(f"\n❌ FATAL ERROR:\n{e}")
-    # don't stop the program, so we can still read the log
-    pass
-
-# Simple interface (won't work if loading failed, but kept so the app doesn't crash)
-def dummy_chat(message, history):
-    return "Model failed to load. Check logs."
-
-demo = gr.ChatInterface(fn=dummy_chat, title="Error Loading Model")
+    print(f"✅ Model downloaded to: {model_path}")
+except Exception as e:
+    print(f"❌ Error downloading: {e}")
+    raise e
+
+print("⚙️ Loading LLM...")
+# Settings well suited to fast responses
+llm = Llama(
+    model_path=model_path,
+    n_ctx=4096,
+    n_threads=2,
+    verbose=False
+)
+print("✅ LLM Loaded!")
+
+def generate_response(message, history):
+    # Qwen 2.5 prompt format, for best accuracy
+    prompt = f"<|im_start|>user\n{message}<|im_end|>\n<|im_start|>assistant\n"
+
+    output = llm(
+        prompt,
+        max_tokens=512,
+        stop=["<|im_end|>"],
+        echo=False
+    )
+    return output['choices'][0]['text']
+
+# A simple interface for testing
+demo = gr.ChatInterface(
+    fn=generate_response,
+    title="My Private AI 🧠",
+    description="Qwen 2.5 - Running Securely on Docker"
+)
 
+# Run the server
 if __name__ == "__main__":
     demo.launch(server_name="0.0.0.0", server_port=7860)
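One thing worth noting about the committed generate_response: it ignores the history argument Gradio passes in, so every turn is answered with no memory of the conversation. A minimal sketch of a history-aware variant, not part of this commit, assuming Gradio's default pair-style history (a list of [user, assistant] pairs) and the same llm object loaded above:

# Hypothetical variant, not part of this commit: folds prior turns into the
# same Qwen 2.5 <|im_start|>/<|im_end|> template before the new message.
# Assumes pair-style history: a list of [user_msg, assistant_msg] pairs.
def generate_response(message, history):
    prompt = ""
    for user_msg, assistant_msg in history:
        prompt += f"<|im_start|>user\n{user_msg}<|im_end|>\n"
        prompt += f"<|im_start|>assistant\n{assistant_msg}<|im_end|>\n"
    prompt += f"<|im_start|>user\n{message}<|im_end|>\n<|im_start|>assistant\n"

    output = llm(
        prompt,
        max_tokens=512,
        stop=["<|im_end|>"],
        echo=False
    )
    return output['choices'][0]['text']

Long conversations would eventually overflow the n_ctx=4096 window, so older turns would need trimming. Alternatively, llama-cpp-python exposes llm.create_chat_completion(messages=[...]), which applies the chat template embedded in the GGUF file and avoids hand-building these prompt strings.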