Spaces:

Adillega
/

AdIlleagal

Sleeping

App Files Files Community

Dhom1 committed on Jul 13

Commit

4843d43

verified ·

1 Parent(s): d2dddfc

Update src/streamlit_app.py

Browse files

Files changed (1) hide show

src/streamlit_app.py +75 -42

src/streamlit_app.py CHANGED Viewed

@@ -1,7 +1,6 @@
 import os
 import streamlit as st
 import pandas as pd
-from io import StringIO
 from transformers import pipeline
 import joblib
@@ -9,70 +8,106 @@ import joblib
 os.environ["HF_HOME"] = "/tmp"
 os.environ["TRANSFORMERS_CACHE"] = "/tmp"
-# ---- تحميل نموذج التصنيف العربي ----
 @st.cache_resource
 def load_classifier():
-    return joblib.load("src/job_classifier.pkl")  # تأكد من المسار الصحيح
-classifier = load_classifier()
-# ---- تحميل نموذج GPT-2 ----
 @st.cache_resource
 def load_gpt2():
     return pipeline("text-generation", model="gpt2", model_kwargs={"cache_dir": "/tmp"})
 gpt2_pipeline = load_gpt2()
-# ---- إعداد صفحة Streamlit ----
-st.set_page_config(page_title="رصد الإعلانات المخالفة")
-st.title("📢 نظام رصد الإعلانات المخالفة")
 st.markdown("""
-### 🧠 هذا النظام يستخدم الذكاء الاصطناعي لرصد الإعلانات المخالفة
-ارفع نص إعلان وسنقوم بتحليله واكتشاف أي محتوى مخالف بناءً على قواعد محددة.
-""")
-# ---- رفع نص الإعلان ----
 uploaded_text = st.text_area("✍️ أدخل نص الإعلان هنا:", height=150)
-# ---- تصنيف الإعلان باستخدام النموذج ----
-st.subheader("📊 تصنيف الإعلان باستخدام نموذج التعلم الآلي")
 if uploaded_text:
     try:
         pred = classifier.predict([uploaded_text])[0]
         label = "✅ إعلان سليم" if pred == 1 else "❌ إعلان مخالف"
-        st.info(f"نتيجة النموذج: {label}")
     except Exception as e:
-        st.error(f"حدث خطأ في التنبؤ بالنموذج: {str(e)}")
-# ---- قاعدة بيانات كلمات/عبارات مخالفة ----
 offensive_keywords = [
     "مطلوب سعودية", "مظهر لائق", "براتب 1500", "للرجال فقط", "بدون عقد",
     "يفضل سعودية", "شرط العمر", "جنسية معينة", "تحمل ضغط العمل", "الوظيفة للذكور فقط"
 ]
-# ---- تحليل النص باستخدام الكلمات المفتاحية ----
-if st.button("🔍 تحليل الإعلان") and uploaded_text:
-    violations = [kw for kw in offensive_keywords if kw in uploaded_text]
-    if violations:
-        st.error("❌ الإعلان يحتوي على عبارات مخالفة!")
-        st.write("**العبارات المكتشفة:**")
-        for v in violations:
-            st.write(f"- {v}")
-        violation_score = min(5 + len(violations) * 20, 95)
-    else:
-        st.success("✅ الإعلان لا يحتوي على عبارات مخالفة ظاهرة.")
-        violation_score = 5
-    st.metric(label="نسبة المخالفة المتوقعة", value=f"{violation_score}%")
-# ---- توليد توصيات باستخدام GPT-2 ----
-st.subheader("🧠 توصيات الذكاء الاصطناعي (GPT-2)")
 if uploaded_text:
-    gpt_prompt = f"""
 You are an AI that checks for violations in job advertisements based on Saudi labor laws.
 Here is the ad:
 \"{uploaded_text}\"
@@ -80,11 +115,9 @@ Here is the ad:
 Please identify any potential violations and give recommendations to fix them.
 Violations:
 """
-    with st.spinner("يتم الآن تحليل الإعلان بواسطة GPT-2..."):
         try:
-            result = gpt2_pipeline(gpt_prompt, max_new_tokens=150)[0]["generated_text"]
-            st.success("✅ تم تحليل الإعلان")
-            st.text_area("📋 مخرجات GPT-2:", result, height=300)
         except Exception as e:
-            st.error(f"حدث خطأ أثناء استخدام GPT-2: {str(e)}")

 import os
 import streamlit as st
 import pandas as pd
 from transformers import pipeline
 import joblib
 os.environ["HF_HOME"] = "/tmp"
 os.environ["TRANSFORMERS_CACHE"] = "/tmp"
 @st.cache_resource
 def load_classifier():
+    return joblib.load("src/job_classifier.pkl")
 @st.cache_resource
 def load_gpt2():
     return pipeline("text-generation", model="gpt2", model_kwargs={"cache_dir": "/tmp"})
+classifier = load_classifier()
 gpt2_pipeline = load_gpt2()
+# ✅ إعداد الصفحة
+st.set_page_config(page_title="نظام رصد الإعلانات", layout="wide")
+# ✅ تنسيق CSS مستوحى من الهاكاثون
 st.markdown("""
+<style>
+body {
+    background-color: #f6f9fc;
+    font-family: 'Segoe UI', sans-serif;
+}
+h1, h2, h3 {
+    color: #004c97;
+}
+.stButton > button {
+    background: linear-gradient(90deg, #007bff, #00b8a9);
+    color: white;
+    font-weight: 600;
+    border-radius: 8px;
+    padding: 0.6em 1.4em;
+    border: none;
+}
+.stButton > button:hover {
+    transform: scale(1.03);
+}
+.stTextArea textarea {
+    background-color: #ffffff;
+    border-radius: 10px;
+    border: 1px solid #d0d7de;
+    padding: 12px;
+}
+.metric-container {
+    background-color: white;
+    padding: 20px;
+    border-radius: 12px;
+    box-shadow: 0 2px 8px rgba(0,0,0,0.05);
+    margin-top: 20px;
+}
+</style>
+""", unsafe_allow_html=True)
+# ✅ رأس الصفحة
+col1, col2 = st.columns([1, 6])
+with col1:
+    st.image("https://www.healthmatrixcorp.com/web/image/website/1/logo/Health%20Matrix?unique=956ad7b", width=120)
+with col2:
+    st.markdown("""
+        <h1>📢 نظام رصد الإعلانات المخالفة</h1>
+        <p style="color:#5BA241; margin-top: -10px;">تحليل ذكي يستند إلى القوانين السعودية</p>
+    """, unsafe_allow_html=True)
+# ✅ إدخال الإعلان
 uploaded_text = st.text_area("✍️ أدخل نص الإعلان هنا:", height=150)
+# ✅ نموذج التصنيف
+st.subheader("📊 تصنيف الإعلان")
 if uploaded_text:
     try:
         pred = classifier.predict([uploaded_text])[0]
         label = "✅ إعلان سليم" if pred == 1 else "❌ إعلان مخالف"
+        st.markdown(f'<div class="metric-container"><h4>{label}</h4></div>', unsafe_allow_html=True)
     except Exception as e:
+        st.error(f"حدث خطأ في التنبؤ: {str(e)}")
+# ✅ كلمات مخالفة
 offensive_keywords = [
     "مطلوب سعودية", "مظهر لائق", "براتب 1500", "للرجال فقط", "بدون عقد",
     "يفضل سعودية", "شرط العمر", "جنسية معينة", "تحمل ضغط العمل", "الوظيفة للذكور فقط"
 ]
+if st.button("🔍 تحليل العبارات"):
+    if uploaded_text:
+        violations = [kw for kw in offensive_keywords if kw in uploaded_text]
+        if violations:
+            st.error("❌ الإعلان يحتوي على عبارات مخالفة:")
+            for v in violations:
+                st.markdown(f"<li style='color:#b00020'>{v}</li>", unsafe_allow_html=True)
+            violation_score = min(5 + len(violations) * 20, 95)
+        else:
+            st.success("✅ لا توجد عبارات مخالفة.")
+            violation_score = 5
+        st.metric(label="نسبة المخالفة المتوقعة", value=f"{violation_score}%")
+# ✅ توصيات GPT-2
+st.subheader("💡 توصيات الذكاء الاصطناعي")
 if uploaded_text:
+    prompt = f"""
 You are an AI that checks for violations in job advertisements based on Saudi labor laws.
 Here is the ad:
 \"{uploaded_text}\"
 Please identify any potential violations and give recommendations to fix them.
 Violations:
 """
+    with st.spinner("📡 جاري التحليل..."):
         try:
+            result = gpt2_pipeline(prompt, max_new_tokens=150)[0]["generated_text"]
+            st.text_area("📋 نتائج GPT-2:", result, height=300)
         except Exception as e:
+            st.error(f"خطأ في توليد النتائج: {str(e)}")