Spaces:

Shirjannn
/

Philsof

Sleeping

App Files Community

Shirjannn committed on Aug 16, 2025

Commit

62e6a56

verified ·

1 Parent(s): 820d22d

Update app.py

Browse files

Files changed (1) hide show

app.py +37 -68

app.py CHANGED Viewed

@@ -1,73 +1,42 @@
 import gradio as gr
-import numpy as np
 import pandas as pd
-import zipfile, os
-from sklearn.metrics.pairwise import cosine_similarity
-from sentence_transformers import SentenceTransformer
-from sklearn.decomposition import PCA
-import plotly.graph_objects as go
-# مدل زبانی
-model = SentenceTransformer('paraphrase-multilingual-MiniLM-L12-v2')
-# مسیر فایل ZIP
-zip_path = "school_data.zip"
-extract_folder = "school_data"
-# استخراج ZIP اگر هنوز استخراج نشده
-if not os.path.exists(extract_folder):
-    with zipfile.ZipFile(zip_path, "r") as zip_ref:
-        zip_ref.extractall(extract_folder)
-# لود دیتای CSV ها
-school_data_dynamic = {}
-for file in os.listdir(extract_folder):
-    if file.endswith(".csv"):
-        df = pd.read_csv(os.path.join(extract_folder, file))
-        # فرض: ستون اول = key ، ستون دوم = متن
-        if df.shape[1] >= 2:
-            for _, row in df.iterrows():
-                key = str(row[0])
-                value = str(row[1])
-                school_data_dynamic[key] = value
-# تبدیل دیتای متنی به embedding
-texts = list(school_data_dynamic.values())
-keys = list(school_data_dynamic.keys())
-embeddings = model.encode(texts, convert_to_tensor=False)
-# کاهش ابعاد برای رسم
-pca = PCA(n_components=2)
-reduced_embeddings = pca.fit_transform(embeddings)
-# تابع جستجو
-def search(query):
-    query_emb = model.encode([query], convert_to_tensor=False)
-    sims = cosine_similarity([query_emb[0]], embeddings)[0]
-    top_idx = np.argmax(sims)
-    return f"Closest match: {keys[top_idx]} → {texts[top_idx]}"
-# تابع برای رسم گراف
-def plot_embeddings():
-    fig = go.Figure()
-    fig.add_trace(go.Scatter(
-        x=reduced_embeddings[:,0],
-        y=reduced_embeddings[:,1],
-        mode="markers+text",
-        text=keys,
-        textposition="top center"
-    ))
-    return fig
-# رابط Gradio
 with gr.Blocks() as demo:
-    gr.Markdown("# 🔍 Semantic Search in School Data")
-    inp = gr.Textbox(label="Enter your query")
-    out = gr.Textbox(label="Best Match")
-    btn = gr.Button("Search")
-    graph = gr.Plot(label="Embedding Visualization")
-    btn.click(fn=search, inputs=inp, outputs=out)
-    demo.load(fn=plot_embeddings, inputs=None, outputs=graph)
 demo.launch()

 import gradio as gr
 import pandas as pd
+import os
+# Path to the quotes CSV file (a relative path)
+csv_path = "stoic_quotes_full.csv"
+# Load the data: read the CSV at csv_path with pandas; returns None (instead of raising) when the file does not exist
+def load_data():
+    if not os.path.exists(csv_path):
+        return None
+    return pd.read_csv(csv_path)
+# Analyze text: look the input up as an exact, case-insensitive match in the 'quote' column and return a status message naming the 'philosopher' of the first match. NOTE(review): the CSV is re-read via load_data() on every call.
+def analyze_text(text):
+    df = load_data()
+    if df is None:
+        return "❌ دیتابیس پیدا نشد."
+    text = text.strip().lower()
+    if not text:
+        return "⚠️ لطفاً یک متن وارد کنید."
+    # Search the quotes: compare the lowercased 'quote' column to the normalized input (only the input is stripped, not the stored quotes)
+    match = df[df['quote'].str.lower() == text]
+    if not match.empty:
+        philosopher = match.iloc[0]['philosopher']
+        return f"✅ این جمله از {philosopher} است."
+    else:
+        return "❌ این جمله در دیتاست وجود ندارد."
+# User interface: a Gradio Blocks layout with a heading, an input textbox, a button, and a result textbox; clicking the button runs analyze_text on the input
 with gr.Blocks() as demo:
+    gr.Markdown("## متن فلسفی را وارد کنید")
+    text_input = gr.Textbox(label="متن")
+    analyze_btn = gr.Button("تحلیل")
+    output = gr.Textbox(label="نتیجه")
+    analyze_btn.click(analyze_text, inputs=text_input, outputs=output)
 demo.launch()