Update app.py
app.py
CHANGED
@@ -1,18 +1,38 @@
-from fastapi import FastAPI
 import gradio as gr
 from sentence_transformers import SentenceTransformer, util
 import torch
+import logging
 
+# Set up logging
+logging.basicConfig(level=logging.INFO)
+logger = logging.getLogger(__name__)
 
+# Load model
+logger.info("Loading model...")
+try:
+    model = SentenceTransformer("CAMeL-Lab/bert-base-arabic-camelbert-ca")
+except Exception as e:
+    logger.error(f"Failed to load model: {e}")
+    raise
 
+# Load knowledge file
+logger.info("Loading knowledge file...")
+try:
+    with open("knowledge.txt", "r", encoding="utf-8") as f:
+        knowledge_text = f.read()
+    if not knowledge_text.strip():
+        raise ValueError("knowledge.txt is empty")
+except FileNotFoundError:
+    logger.error("knowledge.txt not found")
+    raise
+except Exception as e:
+    logger.error(f"Error reading knowledge.txt: {e}")
+    raise
+
+# Split text into chunks
+def split_text(text, chunk_size=200):
+    logger.info("Splitting text into chunks...")
+    sentences = text.split("،")
     chunks, chunk = [], ""
     for sentence in sentences:
         if len(chunk) + len(sentence) < chunk_size:
@@ -24,29 +44,39 @@ def split_text(text, chunk_size=400):
         chunks.append(chunk.strip())
     return chunks
 
+# Generate embeddings
+logger.info("Generating embeddings...")
+try:
+    chunks = split_text(knowledge_text)
+    corpus_embeddings = model.encode(chunks, convert_to_tensor=True, batch_size=16)
+except Exception as e:
+    logger.error(f"Error generating embeddings: {e}")
+    raise
 
 # Search function
 def answer_question(question):
+    try:
+        if not question.strip():
+            return "الرجاء إدخال سؤال."
+        question_embedding = model.encode(question, convert_to_tensor=True)
+        scores = util.cos_sim(question_embedding, corpus_embeddings)[0]
+        best_idx = torch.argmax(scores).item()
+        score = scores[best_idx].item()
+        logger.info(f"Question: {question}, Best chunk: {chunks[best_idx][:50]}..., Score: {score:.4f}")
+        return chunks[best_idx] if score > 0.3 else "عذرًا، لم أجد إجابة مناسبة. حاول صياغة السؤال بطريقة أخرى."
+    except Exception as e:
+        logger.error(f"Error answering question: {e}")
+        return "حدث خطأ أثناء معالجة السؤال. حاول مرة أخرى."
 
 # Gradio UI
+logger.info("Setting up Gradio UI...")
 with gr.Blocks() as demo:
     gr.Markdown("### 🤖 اسأل عن التنمية المستدامة أو الموازنة التشاركية")
     with gr.Row():
-        inp = gr.Textbox(label="اكتب سؤالك هنا", placeholder="مثال: ما هي أهداف التنمية المستدامة؟")
-        out = gr.Textbox(label="الإجابة")
+        inp = gr.Textbox(label="اكتب سؤالك هنا", placeholder="مثال: ما هي أهداف التنمية المستدامة؟", dir="rtl")
+        out = gr.Textbox(label="الإجابة", dir="rtl")
     btn = gr.Button("إجابة")
     btn.click(fn=answer_question, inputs=inp, outputs=out)
 
-@app.get("/")
-def read_root():
-    return {"message": "Arabic Q&A Chatbot running."}
-
-app = gr.mount_gradio_app(app, demo, path="/")
+# Launch Gradio app (Hugging Face Spaces will handle this automatically)
+demo.launch(server_name="0.0.0.0", server_port=7860)
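For reference, the retrieval this commit wraps in logging and try/except is a plain embedding search: the chunks of knowledge.txt are encoded once at startup, each incoming question is encoded with the same model, and the chunk with the highest cosine similarity is returned unless the score falls below 0.3. A standalone sketch of that step, using the same CAMeL-Lab checkpoint from the commit but with two made-up example chunks standing in for the real knowledge.txt:

# Standalone sketch of the retrieval step; the chunks below are illustrative only.
from sentence_transformers import SentenceTransformer, util
import torch

model = SentenceTransformer("CAMeL-Lab/bert-base-arabic-camelbert-ca")

chunks = [
    "التنمية المستدامة هي تلبية احتياجات الحاضر دون المساس بقدرة الأجيال القادمة على تلبية احتياجاتها.",
    "الموازنة التشاركية تتيح للمواطنين المشاركة في تحديد أولويات الإنفاق العام.",
]
corpus_embeddings = model.encode(chunks, convert_to_tensor=True)

question = "ما هي التنمية المستدامة؟"
question_embedding = model.encode(question, convert_to_tensor=True)
scores = util.cos_sim(question_embedding, corpus_embeddings)[0]  # cosine similarity against every chunk
best_idx = torch.argmax(scores).item()

# Same decision rule as answer_question(): accept the best chunk only above 0.3
if scores[best_idx].item() > 0.3:
    print(chunks[best_idx])
else:
    print("No sufficiently similar chunk found.")

One caveat: CAMeL-Lab/bert-base-arabic-camelbert-ca is a general Arabic BERT checkpoint rather than a model fine-tuned for sentence similarity, so sentence-transformers falls back to mean pooling over token embeddings; that is worth keeping in mind when judging whether the 0.3 cutoff is strict enough.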
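One assumption worth stating: with fastapi and gr.mount_gradio_app() gone, the Space only needs the Gradio stack at runtime, so a requirements.txt along these lines should be enough (the file itself is not part of this commit):

gradio
sentence-transformers
torch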