smart-moderator

Sleeping

App Files Community

nixaut-codelabs committed on Aug 21, 2025

Commit

f2361fc

verified ·

1 Parent(s): 5a39cfb

Update app.py

Browse files

Files changed (1) hide show

app.py +43 -60

app.py CHANGED Viewed

@@ -6,12 +6,11 @@ import gradio as gr
 from huggingface_hub import snapshot_download
 from transformers import AutoTokenizer, AutoModelForCausalLM, TextIteratorStreamer
-# --- Model ve Ortam Ayarları (Değişiklik yok) ---
 MODEL_REPO = "daniel-dona/gemma-3-270m-it"
 LOCAL_DIR = os.path.join(os.getcwd(), "local_model")
 os.environ.setdefault("HF_HUB_ENABLE_HF_TRANSFER", "1")
-os.environ.setdefault("OMP_NUM_THREADS", str(os.cpu_count() or 2))
 os.environ.setdefault("MKL_NUM_THREADS", os.environ["OMP_NUM_THREADS"])
 os.environ.setdefault("OMP_PROC_BIND", "TRUE")
@@ -74,20 +73,23 @@ MODERATION_SYSTEM_PROMPT = (
     "Otherwise respond 's'."
 )
-# --- Yardımcı Fonksiyonlar (Değişiklik yok) ---
 def build_prompt(message, max_ctx_tokens=128):
     full_user_message = f"{MODERATION_SYSTEM_PROMPT}\n\nUser input: '{message}'"
     messages = [{"role": "user", "content": full_user_message}]
     text = tokenizer.apply_chat_template(
-        messages, tokenize=False, add_generation_prompt=True
     )
     while len(tokenizer(text, add_special_tokens=False).input_ids) > max_ctx_tokens and len(full_user_message) > 100:
         full_user_message = full_user_message[:-50]
         messages[0]['content'] = full_user_message
         text = tokenizer.apply_chat_template(
-            messages, tokenize=False, add_generation_prompt=True
         )
     return text
@@ -99,31 +101,24 @@ def enforce_s_u(text: str) -> str:
         return "u"
     return "s"
-# --- YENİ: Sonuçları Gradio bileşenlerine formatlayan fonksiyon ---
 def format_classification_result(classification, tokens_per_second, processing_time):
-    """
-    Sınıflandırma sonucunu birden fazla Gradio bileşenine uygun bir demet (tuple) olarak döndürür.
-    """
     if classification == "s":
-        label = {"label": "✅ GÜVENLİ", "confidences": [{"label": "GÜVENLİ", "confidence": 1.0}]}
-        description = "İçeriğin güvenli ve uygun olduğu tespit edildi."
     else:
-        label = {"label": "🚫 GÜVENLİ DEĞİL", "confidences": [{"label": "GÜVENLİ DEĞİL", "confidence": 1.0}]}
-        description = "İçerik, uygunsuz veya zararlı materyal barındırıyor olabilir."
     tps_str = f"{tokens_per_second:.1f} tok/s"
     time_str = f"{processing_time:.2f} s"
     return label, description, tps_str, time_str
-# --- GÜNCELLENDİ: Ana Sınıflandırma Fonksiyonu ---
 def classify_text_stream(message, max_tokens, temperature, top_p, progress=gr.Progress()):
     if not message.strip():
-        # HTML yerine yeni formatta varsayılan değerleri döndür
         return format_classification_result("s", 0, 0)
-    progress(0, desc="Sınıflandırma hazırlanıyor...")
     text = build_prompt(message)
     inputs = tokenizer([text], return_tensors="pt").to(model.device)
     do_sample = bool(temperature and temperature > 0.0)
@@ -151,7 +146,7 @@ def classify_text_stream(message, max_tokens, temperature, top_p, progress=gr.Pr
     token_count = 0
     start_time = None
-    progress(0.3, desc="İçerik işleniyor...")
     with torch.inference_mode():
         thread.start()
@@ -161,7 +156,7 @@ def classify_text_stream(message, max_tokens, temperature, top_p, progress=gr.Pr
                     start_time = time.time()
                 partial_text += chunk
                 token_count += 1
-                progress(0.3 + (token_count / max_tokens) * 0.6, desc="Analiz ediliyor...")
         finally:
             thread.join()
@@ -170,18 +165,15 @@ def classify_text_stream(message, max_tokens, temperature, top_p, progress=gr.Pr
     duration = max(1e-6, end_time - start_time)
     tps = token_count / duration if duration > 0 else 0.0
-    progress(1.0, desc="Tamamlandı!")
-    # HTML dizesi yerine, birden çok bileşen için bir demet (tuple) döndür
     return format_classification_result(final_label, tps, duration)
-# --- YENİ: Gradio Arayüzü (HTML/CSS olmadan) ---
-with gr.Blocks(title="AI İçerik Moderatörü", theme=gr.themes.Soft()) as demo:
     gr.Markdown(
         """
-        # 🛡️ AI İçerik Moderatörü
-        Yapay zeka ile güçlendirilmiş, çok dilli ve gelişmiş içerik sınıflandırma aracı.
         """
     )
@@ -189,90 +181,81 @@ with gr.Blocks(title="AI İçerik Moderatörü", theme=gr.themes.Soft()) as demo
         with gr.Column(scale=3):
             with gr.Group():
                 text_input = gr.Textbox(
-                    label="Analiz Edilecek Metin",
-                    placeholder="İçerik denetimi analizi için herhangi bir dilde metin girin...",
                     lines=8,
                     max_lines=15
                 )
                 with gr.Row():
-                    clear_btn = gr.Button("🗑️ Temizle", variant="secondary")
-                    classify_btn = gr.Button("🔍 Analiz Et", variant="primary", scale=2)
         with gr.Column(scale=2):
-            gr.Markdown("### 📊 Sınıflandırma Sonucu")
-            result_label = gr.Label(label="Durum", num_top_classes=1)
-            result_description = gr.Markdown(value="*Analiz için bir metin girip 'Analiz Et' butonuna tıklayın.*")
             with gr.Row():
-                tps_output = gr.Textbox(label="Performans (Token/sn)", interactive=False)
-                time_output = gr.Textbox(label="İşlem Süresi (sn)", interactive=False)
-    with gr.Accordion("⚙️ Gelişmiş Ayarlar", open=False):
         with gr.Row():
             max_tokens_slider = gr.Slider(
                 minimum=1, maximum=10, value=3, step=1,
-                label="Maksimum Token",
-                info="Modelin üreteceği maksimum token sayısı (genellikle 1-3 arası yeterlidir)"
             )
             temp_slider = gr.Slider(
                 minimum=0.0, maximum=1.0, value=0.1, step=0.1,
-                label="Sıcaklık (Temperature)",
-                info="Üretimdeki rastgeleliği kontrol eder"
             )
             top_p_slider = gr.Slider(
                 minimum=0.1, maximum=1.0, value=0.95, step=0.05,
                 label="Top-p",
-                info="Çekirdek örnekleme parametresi"
             )
-    gr.Markdown("### 💡 Örnekleri Deneyin")
     gr.Examples(
         examples=[
-            ["Merhaba, bugün nasılsın? Umarım harika bir gün geçiriyorsundur!"],
-            ["Senden nefret ediyorum, seni bulup canını çok yakacağım."],
             ["C'est une belle journée pour apprendre la programmation et l'intelligence artificielle."],
-            ["Artık dayanamıyorum. Her şeyi bitirip sonsuza dek yok olmak istiyorum."],
             ["¡Hola! Me encanta aprender nuevos idiomas y conocer diferentes culturas."],
-            ["Sen kesinlikle değersiz birisin ve kimse senin gibi birini sevmeyecek."]
         ],
         inputs=text_input,
-        label="Örnek Metinler"
     )
-    # --- Butonların Olay Yöneticileri ---
-    # Varsayılan durumu döndüren bir yardımcı fonksiyon
     def get_default_state():
-        default_label, default_desc, default_tps, default_time = format_classification_result("s", 0, 0)
-        # Etiketin boş görünmesi için başlangıçta None olarak ayarlıyoruz
-        return "", None, "*Analiz için bir metin girin.*", "0.0 tok/s", "0.00 s"
-    # classify_btn tıklandığında, birden fazla çıkışı günceller
     classify_btn.click(
         fn=classify_text_stream,
         inputs=[text_input, max_tokens_slider, temp_slider, top_p_slider],
         outputs=[result_label, result_description, tps_output, time_output]
     )
-    # clear_btn tıklandığında, hem girişi hem de tüm çıkışları temizler
     clear_btn.click(
         fn=get_default_state,
         outputs=[text_input, result_label, result_description, tps_output, time_output]
     )
-    # Arayüz ilk yüklendiğinde varsayılan durumu ayarla
     demo.load(
-        fn=lambda: (None, "*Analiz için bir metin girin.*", "0.0 tok/s", "0.00 s"),
         outputs=[result_label, result_description, tps_output, time_output]
     )
 if __name__ == "__main__":
-    # Modelin ilk çıkarım için ısınmasını sağla
     with torch.inference_mode():
         _ = model.generate(
-            **tokenizer(["Merhaba"], return_tensors="pt").to(model.device),
             max_new_tokens=1, do_sample=False, use_cache=True
         )
-    print("🚀 AI İçerik Moderatörü Başlatılıyor...")
     demo.queue(max_size=64).launch(
         server_name="0.0.0.0",
         server_port=7860,

 from huggingface_hub import snapshot_download
 from transformers import AutoTokenizer, AutoModelForCausalLM, TextIteratorStreamer
 MODEL_REPO = "daniel-dona/gemma-3-270m-it"
 LOCAL_DIR = os.path.join(os.getcwd(), "local_model")
 os.environ.setdefault("HF_HUB_ENABLE_HF_TRANSFER", "1")
+os.environ.setdefault("OMP_NUM_THREADS", str(os.cpu_count() or 1))
 os.environ.setdefault("MKL_NUM_THREADS", os.environ["OMP_NUM_THREADS"])
 os.environ.setdefault("OMP_PROC_BIND", "TRUE")
     "Otherwise respond 's'."
 )
 def build_prompt(message, max_ctx_tokens=128):
     full_user_message = f"{MODERATION_SYSTEM_PROMPT}\n\nUser input: '{message}'"
     messages = [{"role": "user", "content": full_user_message}]
     text = tokenizer.apply_chat_template(
+        messages,
+        tokenize=False,
+        add_generation_prompt=True
     )
     while len(tokenizer(text, add_special_tokens=False).input_ids) > max_ctx_tokens and len(full_user_message) > 100:
         full_user_message = full_user_message[:-50]
         messages[0]['content'] = full_user_message
         text = tokenizer.apply_chat_template(
+            messages,
+            tokenize=False,
+            add_generation_prompt=True
         )
     return text
         return "u"
     return "s"
 def format_classification_result(classification, tokens_per_second, processing_time):
     if classification == "s":
+        label = "✅ SAFE"
+        description = "Content appears to be safe and appropriate."
     else:
+        label = "🚫 UNSAFE"
+        description = "Content may contain inappropriate or harmful material."
     tps_str = f"{tokens_per_second:.1f} tok/s"
     time_str = f"{processing_time:.2f} s"
     return label, description, tps_str, time_str
 def classify_text_stream(message, max_tokens, temperature, top_p, progress=gr.Progress()):
     if not message.strip():
         return format_classification_result("s", 0, 0)
+    progress(0, desc="Preparing classification...")
     text = build_prompt(message)
     inputs = tokenizer([text], return_tensors="pt").to(model.device)
     do_sample = bool(temperature and temperature > 0.0)
     token_count = 0
     start_time = None
+    progress(0.3, desc="Processing content...")
     with torch.inference_mode():
         thread.start()
                     start_time = time.time()
                 partial_text += chunk
                 token_count += 1
+                progress(0.3 + (token_count / max_tokens) * 0.6, desc="Analyzing...")
         finally:
             thread.join()
     duration = max(1e-6, end_time - start_time)
     tps = token_count / duration if duration > 0 else 0.0
+    progress(1.0, desc="Complete!")
     return format_classification_result(final_label, tps, duration)
+with gr.Blocks(title="AI Content Moderator", theme=gr.themes.Soft()) as demo:
     gr.Markdown(
         """
+        # 🛡️ AI Content Moderator
+        An advanced, multilingual content classification tool powered by AI.
         """
     )
         with gr.Column(scale=3):
             with gr.Group():
                 text_input = gr.Textbox(
+                    label="Text to Analyze",
+                    placeholder="Enter any text in any language for content moderation analysis...",
                     lines=8,
                     max_lines=15
                 )
                 with gr.Row():
+                    clear_btn = gr.Button("🗑️ Clear", variant="secondary")
+                    classify_btn = gr.Button("🔍 Analyze Content", variant="primary", scale=2)
         with gr.Column(scale=2):
+            gr.Markdown("### 📊 Classification Result")
+            result_label = gr.Label(label="Status")
+            result_description = gr.Markdown(value="*Enter text and click 'Analyze Content' to see the result.*")
             with gr.Row():
+                tps_output = gr.Textbox(label="Performance (tok/s)", interactive=False)
+                time_output = gr.Textbox(label="Processing Time (s)", interactive=False)
+    with gr.Accordion("⚙️ Advanced Configuration", open=False):
         with gr.Row():
             max_tokens_slider = gr.Slider(
                 minimum=1, maximum=10, value=3, step=1,
+                label="Max New Tokens",
+                info="Maximum number of tokens for the model to generate (1-3 is usually sufficient)."
             )
             temp_slider = gr.Slider(
                 minimum=0.0, maximum=1.0, value=0.1, step=0.1,
+                label="Temperature",
+                info="Controls the randomness of the generation."
             )
             top_p_slider = gr.Slider(
                 minimum=0.1, maximum=1.0, value=0.95, step=0.05,
                 label="Top-p",
+                info="Nucleus sampling parameter."
             )
+    gr.Markdown("### 💡 Try These Examples")
     gr.Examples(
         examples=[
+            ["Hello, how are you today? I hope you're having a wonderful time!"],
+            ["I hate you and I will find you and hurt you badly."],
             ["C'est une belle journée pour apprendre la programmation et l'intelligence artificielle."],
+            ["I can't take this anymore. I want to end everything and disappear forever."],
             ["¡Hola! Me encanta aprender nuevos idiomas y conocer diferentes culturas."],
+            ["You're absolutely worthless and nobody will ever love someone like you."]
         ],
         inputs=text_input,
+        label="Example Prompts"
     )
     def get_default_state():
+        return "", None, "*Enter text and click 'Analyze Content' to see the result.*", "0.0 tok/s", "0.00 s"
     classify_btn.click(
         fn=classify_text_stream,
         inputs=[text_input, max_tokens_slider, temp_slider, top_p_slider],
         outputs=[result_label, result_description, tps_output, time_output]
     )
     clear_btn.click(
         fn=get_default_state,
         outputs=[text_input, result_label, result_description, tps_output, time_output]
     )
     demo.load(
+        fn=lambda: (None, "*Enter text and click 'Analyze Content' to see the result.*", "0.0 tok/s", "0.00 s"),
         outputs=[result_label, result_description, tps_output, time_output]
     )
 if __name__ == "__main__":
     with torch.inference_mode():
         _ = model.generate(
+            **tokenizer(["Hello"], return_tensors="pt").to(model.device),
             max_new_tokens=1, do_sample=False, use_cache=True
         )
+    print("🚀 Starting AI Content Moderator...")
     demo.queue(max_size=64).launch(
         server_name="0.0.0.0",
         server_port=7860,