Spaces:

mo-456
/

FTCE-chatbot

Sleeping

App Files Community

mo-456 committed on Jul 19, 2025

Commit

b754287

verified ·

1 Parent(s): 8445ea3

Update app.py

Browse files

Files changed (1) hide show

app.py +29 -31

app.py CHANGED Viewed

@@ -6,23 +6,23 @@ import re
 import os
 from typing import List, Tuple
-# إعداد تسجيل الأحداث
 logging.basicConfig(level=logging.INFO)
 logger = logging.getLogger(__name__)
-# تحميل نموذج اللغة العربية (MARBERT)
 try:
     model = SentenceTransformer("UBC-NLP/MARBERT", device="cuda" if torch.cuda.is_available() else "cpu")
     logger.info("تم تحميل النموذج بنجاح")
 except Exception as e:
-    logger.error(f"خطأ في تحميل النموذج: {e}")
     raise
-# تحميل المعرفة من knowledge.txt
 def load_knowledge() -> List[str]:
     if not os.path.exists("knowledge.txt"):
         logger.warning("ملف المعرفة غير موجود.")
-        return ["عام: لم يتم العثور على محتوى المعرفة."]
     chunks = []
     current_section = "عام"
@@ -34,16 +34,16 @@ def load_knowledge() -> List[str]:
             elif line:
                 chunks.append(f"{current_section}: {line}")
-    logger.info(f"تم تحميل عدد {len(chunks)} قطعة معرفة.")
     return chunks
 knowledge_chunks = load_knowledge()
 knowledge_embeddings = model.encode(knowledge_chunks, convert_to_tensor=True)
-# تنظيف السؤال وتعديله
 def preprocess_question(question: str) -> str:
     question = re.sub(r'[؟\?،,\.]', '', question).strip()
-    substitutions = {
         r'\bماهي\b': 'ما هي',
         r'\bماهو\b': 'ما هو',
         r'\bكيفية\b': 'كيف',
@@ -52,15 +52,15 @@ def preprocess_question(question: str) -> str:
         r'\bعاوز\b': 'كيف يمكن',
         r'\bعايز\b': 'كيف يمكن'
     }
-    for pattern, replacement in substitutions.items():
-        question = re.sub(pattern, replacement, question)
     return question
-# توليد الرد على السؤال بناءً على أقرب المعرفة
 def generate_response(question: str, top_chunks: List[Tuple[str, float]]) -> str:
     if not top_chunks:
         suggestions = [
-            "أعد صياغة سؤالك بشكل أوضح.",
             "جرّب استخدام كلمات أخرى.",
             "ابحث في قسم مختلف من المعرفة."
         ]
@@ -76,15 +76,13 @@ def generate_response(question: str, top_chunks: List[Tuple[str, float]]) -> str
             sections[section] = []
         sections[section].append((content.strip(), score))
-    # القسم الرئيسي
-    main_section = max(sections.keys(), key=lambda k: sum(s for _, s in sections[k]) / len(sections[k]))
     response = f"سؤالك: {question}\n\n"
     response += f"{main_section}:\n"
     for content, _ in sorted(sections[main_section], key=lambda x: x[1], reverse=True):
         response += f"- {content}\n"
-    # معلومات إضافية
     other_sections = [s for s in sections if s != main_section]
     if other_sections:
         response += "\nمعلومات إضافية:\n"
@@ -92,16 +90,16 @@ def generate_response(question: str, top_chunks: List[Tuple[str, float]]) -> str
             response += f"\nمن {section}:\n"
             for content, _ in sorted(sections[section], key=lambda x: x[1], reverse=True)[:2]:
                 response += f"- {content}\n"
     return response
-# معالجة السؤال من المستخدم
 def answer_question(question: str) -> str:
     if not question or len(question.strip()) < 3:
         return "يرجى إدخال سؤال واضح لا يقل عن ثلاث كلمات."
     question = preprocess_question(question)
-    logger.info(f"جاري معالجة السؤال: {question}")
     try:
         q_embedding = model.encode(question, convert_to_tensor=True)
@@ -122,25 +120,25 @@ def answer_question(question: str) -> str:
         return generate_response(question, top_chunks)
     except Exception as e:
-        logger.error(f"فشل في توليد الإجابة: {e}")
-        return "حدث خطأ أثناء توليد الإجابة. حاول مرة أخرى."
 # واجهة Gradio
-with gr.Blocks(css=\".arabic-ui {direction: rtl; text-align: right; font-family: Tahoma;}\") as demo:
-    with gr.Column(elem_classes=\"arabic-ui\"):
-        gr.Markdown(\"\"\"### المساعد الذكي لوحدة الشفافية بوزارة المالية\nاسأل أي شيء عن الموازنة، المشاركة المجتمعية، أو المشروعات المالية\"\"\")
-        question = gr.Textbox(label=\"سؤالك\", placeholder=\"ما هي أهداف الموازنة التشاركية؟\", lines=3)
-        submit_btn = gr.Button(\"إرسال السؤال\", variant=\"primary\")
-        answer = gr.Textbox(label=\"الإجابة\", lines=12, interactive=False)
         gr.Examples(
             examples=[
-                [\"ما هي أهداف الموازنة التشاركية؟\"],
-                [\"من هي رئيسة وحدة الشفافية؟\"],
-                [\"ما هو دور المواطن في الموازنة؟\"]
             ],
             inputs=question
         )
         submit_btn.click(answer_question, inputs=question, outputs=answer)
-if __name__ == \"__main__\":
-    demo.launch(server_name=\"0.0.0.0\", server_port=7860, share=False)

 import os
 from typing import List, Tuple
+# إعداد التسجيل
 logging.basicConfig(level=logging.INFO)
 logger = logging.getLogger(__name__)
+# تحميل نموذج MARBERT
 try:
     model = SentenceTransformer("UBC-NLP/MARBERT", device="cuda" if torch.cuda.is_available() else "cpu")
     logger.info("تم تحميل النموذج بنجاح")
 except Exception as e:
+    logger.error(f"فشل تحميل النموذج: {e}")
     raise
+# تحميل المعرفة
 def load_knowledge() -> List[str]:
     if not os.path.exists("knowledge.txt"):
         logger.warning("ملف المعرفة غير موجود.")
+        return ["عام: لا يوجد محتوى معرفي متاح."]
     chunks = []
     current_section = "عام"
             elif line:
                 chunks.append(f"{current_section}: {line}")
+    logger.info(f"تم تحميل {len(chunks)} قطعة معرفة.")
     return chunks
 knowledge_chunks = load_knowledge()
 knowledge_embeddings = model.encode(knowledge_chunks, convert_to_tensor=True)
+# معالجة السؤال
 def preprocess_question(question: str) -> str:
     question = re.sub(r'[؟\?،,\.]', '', question).strip()
+    replacements = {
         r'\bماهي\b': 'ما هي',
         r'\bماهو\b': 'ما هو',
         r'\bكيفية\b': 'كيف',
         r'\bعاوز\b': 'كيف يمكن',
         r'\bعايز\b': 'كيف يمكن'
     }
+    for pattern, repl in replacements.items():
+        question = re.sub(pattern, repl, question)
     return question
+# توليد الرد
 def generate_response(question: str, top_chunks: List[Tuple[str, float]]) -> str:
     if not top_chunks:
         suggestions = [
+            "أعد صياغة سؤالك.",
             "جرّب استخدام كلمات أخرى.",
             "ابحث في قسم مختلف من المعرفة."
         ]
             sections[section] = []
         sections[section].append((content.strip(), score))
+    main_section = max(sections, key=lambda s: sum(x[1] for x in sections[s]) / len(sections[s]))
     response = f"سؤالك: {question}\n\n"
     response += f"{main_section}:\n"
     for content, _ in sorted(sections[main_section], key=lambda x: x[1], reverse=True):
         response += f"- {content}\n"
     other_sections = [s for s in sections if s != main_section]
     if other_sections:
         response += "\nمعلومات إضافية:\n"
             response += f"\nمن {section}:\n"
             for content, _ in sorted(sections[section], key=lambda x: x[1], reverse=True)[:2]:
                 response += f"- {content}\n"
     return response
+# الرد النهائي
 def answer_question(question: str) -> str:
     if not question or len(question.strip()) < 3:
         return "يرجى إدخال سؤال واضح لا يقل عن ثلاث كلمات."
     question = preprocess_question(question)
+    logger.info(f"معالجة السؤال: {question}")
     try:
         q_embedding = model.encode(question, convert_to_tensor=True)
         return generate_response(question, top_chunks)
     except Exception as e:
+        logger.error(f"خطأ أثناء توليد الإجابة: {e}")
+        return "حدث خطأ غير متوقع أثناء توليد الإجابة."
 # واجهة Gradio
+with gr.Blocks(css=".arabic-ui {direction: rtl; text-align: right; font-family: Tahoma;}") as demo:
+    with gr.Column(elem_classes="arabic-ui"):
+        gr.Markdown("### المساعد الذكي لوحدة الشفافية\nاسأل عن الموازنة، المشاركة المجتمعية، أو الشفافية المالية.")
+        question = gr.Textbox(label="سؤالك", placeholder="مثال: ما هي أهداف الموازنة التشاركية؟", lines=3)
+        submit_btn = gr.Button("إرسال السؤال", variant="primary")
+        answer = gr.Textbox(label="الإجابة", lines=12, interactive=False)
         gr.Examples(
             examples=[
+                ["ما هي أهداف الموازنة التشاركية؟"],
+                ["من هي رئيسة وحدة الشفافية؟"],
+                ["ما هو دور المواطن في إعداد الموازنة؟"]
             ],
             inputs=question
         )
         submit_btn.click(answer_question, inputs=question, outputs=answer)
+if __name__ == "__main__":
+    demo.launch(server_name="0.0.0.0", server_port=7860, share=False)