Spaces:

xTHExBEASTx
/

Islamic-Web-AI

Sleeping

App Files Files Community

xTHExBEASTx committed on Mar 2

Commit

ecc164c

verified ·

1 Parent(s): 08507f7

Update app.py

Browse files

Files changed (1) hide show

app.py +37 -113

app.py CHANGED Viewed

@@ -1,128 +1,52 @@
-import gradio as gr
 import requests
 from bs4 import BeautifulSoup
 from googlesearch import search
 from huggingface_hub import InferenceClient
-from langdetect import detect
 import os
-# محاولة جلب التوكن من الإعدادات
-hf_token = os.getenv("HF_TOKEN")
-client = InferenceClient("google/gemma-3-4b-it", token=hf_token)
-def get_language(text):
     try:
-        return detect(text)
     except:
-        return "ar"
-def search_islamweb(query):
-    print(f"جاري البحث عن: {query}")
-    full_query = f"site:islamweb.net {query}"
-    try:
-        # الإصدار الجديد يستخدم num_results بدلاً من num و stop
-        links = []
-        results = search(full_query, num_results=3, lang="ar")
-        for link in results:
-            links.append(link)
-        print(f"الروابط المستخرجة: {links}")
-        return links
-    except Exception as e:
-        print(f"فشل البحث في جوجل: {e}")
-        return []
-def scrape_content(url):
-    try:
-        print(f"جاري استخراج محتوى: {url}")
-        headers = {'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/91.0.4472.124 Safari/537.36'}
-        response = requests.get(url, headers=headers, timeout=10)
-        response.encoding = 'utf-8'
-        soup = BeautifulSoup(response.text, 'html.parser')
-        # بنية إسلام ويب قد تختلف، نحاول أكثر من مكان
-        main_content = soup.find('div', {'class': 'item'}) or soup.find('div', {'id': 'fullitem'}) or soup.find('article')
-        if main_content:
-            text = main_content.get_text(strip=True)[:4000]
-            print("تم استخراج النص بنجاح.")
-            return text
-        return ""
-    except Exception as e:
-        print(f"فشل الاستخراج: {e}")
-        return ""
-def islamic_ai_search(question):
-    if not question.strip():
-        yield "الرجاء كتابة سؤال أولاً.", ""
-        return
-    lang = get_language(question)
-    # 1. البحث عن الروابط
-    links = search_islamweb(question)
-    if not links:
-        yield "عذراً، جوجل حظر طلب البحث حالياً. جرب مرة أخرى بعد قليل أو تأكد من إعدادات البحث.", ""
-        return
-    # 2. استخراج السياق
-    context = ""
-    source_link = ""
-    for link in links:
-        content = scrape_content(link)
-        if len(content) > 150:
-            context = content
-            source_link = link
-            break
     if not context:
-        yield "لم أتمكن من قراءة محتوى الفتوى من الروابط الموجودة.", ""
-        return
-    # 3. نظام الرسائل للنموذج
-    system_message = (
-        "You are an expert Islamic researcher. Answer the user's question ONLY using the provided context from IslamWeb. "
-        "Strict rules: \n"
-        "1. If the answer is not in the context, say you don't know.\n"
-        "2. Response language MUST be the same as input question language.\n"
-        f"Context: {context}"
-    )
-    # 4. طلب الإجابة (Streaming)
-    response = ""
-    try:
-        for message in client.chat_completion(
-            messages=[
-                {"role": "system", "content": system_message},
-                {"role": "user", "content": question}
-            ],
-            max_tokens=1000,
-            stream=True,
-        ):
-            token = message.choices[0].delta.content
-            if token:
-                response += token
-                yield response, source_link
-    except Exception as e:
-        print(f"خطأ الـ AI: {e}")
-        yield f"حدث خطأ أثناء توليد الإجابة. تأكد من إضافة HF_TOKEN في الـ Secrets. الخطأ: {e}", source_link
-# واجهة Gradio
-with gr.Blocks() as demo:
-    gr.Markdown("# 🕋 الباحث الإسلامي الذكي")
-    with gr.Row():
-        input_text = gr.Textbox(label="سؤالك / Sorunuz")
-    submit_btn = gr.Button("بحث وتحليل", variant="primary")
-    output_answer = gr.Markdown(label="الإجابة")
-    output_source = gr.Textbox(label="المصدر الأصلي")
-    submit_btn.click(
-        fn=islamic_ai_search,
-        inputs=input_text,
-        outputs=[output_answer, output_source]
     )
-demo.queue().launch()

+from fastapi import FastAPI
 import requests
 from bs4 import BeautifulSoup
 from googlesearch import search
 from huggingface_hub import InferenceClient
 import os
+# FastAPI application object; the /ask route below is registered on it.
+app = FastAPI()
+# Inference client bound to the google/gemma-3-4b-it model. The access token
+# is read from the HF_TOKEN environment variable (None when it is unset).
+client = InferenceClient("google/gemma-3-4b-it", token=os.getenv("HF_TOKEN"))
+def search_and_scrape(question):
+    # نفس منطق البحث والاستخراج السابق
+    full_query = f"site:islamweb.net {question}"
     try:
+        results = search(full_query, num_results=1, lang="ar")
+        link = next(results)
+        headers = {'User-Agent': 'Mozilla/5.0'}
+        resp = requests.get(link, headers=headers, timeout=5)
+        soup = BeautifulSoup(resp.text, 'html.parser')
+        content = soup.find('div', {'class': 'item'}).get_text(strip=True)[:3000]
+        return content, link
     except:
+        return None, None
+@app.post("/ask")
+async def ask_ai(data: dict):
+    question = data.get("question")
+    context, link = search_and_scrape(question)
     if not context:
+        return {"answer": "لم أجد نتائج.", "source": ""}
+    system_msg = f"Answer only from context: {context}"
+    # طلب الإجابة من الموديل
+    response = client.chat_completion(
+        messages=[
+            {"role": "system", "content": system_msg},
+            {"role": "user", "content": question}
+        ],
+        max_tokens=500
     )
+    return {
+        "answer": response.choices[0].message.content,
+        "source": link
+    }
+# Run FastAPI instead of Gradio
+if __name__ == "__main__":
+    # Imported here so uvicorn is only required when this file is executed
+    # directly as a script.
+    import uvicorn
+    # Listen on all interfaces.
+    # NOTE(review): 7860 is presumably the port the hosting Space expects — confirm.
+    uvicorn.run(app, host="0.0.0.0", port=7860)