safiaa02 committed on
Commit
6d14e0b
·
verified ·
1 Parent(s): b1c09b6

Create app.py

Browse files
Files changed (1) hide show
  1. app.py +91 -0
app.py ADDED
@@ -0,0 +1,91 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
import gradio as gr
from groq import Groq
import os

# IMPORTANT: Set your Groq API key in Hugging Face Spaces "Secrets"
# (the commented line below shows the variable name expected).
# os.environ["GROQ_API_KEY"] = "your_api_key_here"

# Module-level Groq client shared by all requests.
# NOTE(review): if GROQ_API_KEY is unset, os.environ.get returns None and the
# client is built with api_key=None — requests will fail later, at call time.
client = Groq(api_key=os.environ.get("GROQ_API_KEY"))
9
+
10
def _complete(prompt):
    """Send a single-turn chat request to Groq and return the stripped reply text."""
    response = client.chat.completions.create(
        messages=[{"role": "user", "content": prompt}],
        model="llama-3.1-8b-instant",
    )
    return response.choices[0].message.content.strip()


def analyze_prompt(user_prompt):
    """Analyze a prompt for LLM security risks and suggest a safer rewrite.

    Makes two Groq chat-completion calls: one to classify vulnerabilities
    (prompt injection, jailbreak, data leakage, etc.) and one to produce a
    safer reformulation of the same prompt.

    Args:
        user_prompt: The prompt text to analyze (may be None or empty, e.g.
            from a cleared Gradio textbox).

    Returns:
        A 4-tuple of strings: (original prompt, vulnerability analysis,
        safer reformulation, status message).
    """
    # Guard both None and whitespace-only input; the original crashed on None
    # because it called .strip() unconditionally.
    if not user_prompt or not user_prompt.strip():
        return "โš ๏ธ Please enter a prompt to analyze.", "", "", ""

    # Step 1: Detect vulnerability type.
    detection_prompt = f"""
You are an AI security analyst.
Analyze the following prompt for potential vulnerabilities against large language models.
Consider these categories:
- Prompt Injection
- Jailbreak / Safety Bypass
- Data Leakage Attempt
- Harmful or Offensive Request
- Hallucination Risk
- Safe / Low Risk

For each detected issue, provide:
- Detected Vulnerability Type(s)
- Risk Level (Low, Medium, High)
- Short Explanation (1โ€“2 sentences)

Prompt to analyze:
{user_prompt}
"""

    # Step 2: Suggest a safer reformulation of the prompt.
    rewrite_prompt = f"""
Rewrite the following prompt in a safer and responsible way
that removes any security risks but keeps the learning intent.

Prompt:
{user_prompt}
"""

    # Surface API failures (network errors, missing/invalid GROQ_API_KEY) in
    # the status field instead of crashing the Gradio handler.
    try:
        analysis = _complete(detection_prompt)
        safer_prompt = _complete(rewrite_prompt)
    except Exception as exc:
        return user_prompt, "", "", f"Error while contacting the model API: {exc}"

    return user_prompt, analysis, safer_prompt, "โœ… Analysis complete."
59
+
60
+
61
# ๐Ÿš€ Gradio UI
# Declarative layout: one input textbox, an analyze button, and four output
# textboxes wired to analyze_prompt via the button's click event.
with gr.Blocks(theme=gr.themes.Soft()) as demo:
    gr.Markdown("## ๐Ÿ” LLM Vulnerability Tester")
    gr.Markdown(
        "Test your prompts for **AI security risks** (prompt injection, jailbreaks, data leakage, etc.).\n"
        "This tool provides a **risk analysis** and a **safer reformulation**."
    )

    # Input area: the prompt under test.
    with gr.Row():
        prompt_input = gr.Textbox(
            label="Enter Prompt to Test",
            placeholder="Type or paste your LLM prompt here...",
            lines=6
        )

    analyze_btn = gr.Button("๐Ÿ” Analyze Prompt")

    # Output area: echoes the original prompt alongside the analysis results.
    # NOTE(review): diff formatting was lossy — assuming all four outputs sit
    # inside this row; confirm against the deployed Space layout.
    with gr.Row():
        original_out = gr.Textbox(label="Original Prompt", lines=6)
        analysis_out = gr.Textbox(label="Vulnerability Analysis", lines=8)
        safer_out = gr.Textbox(label="Safer Reformulation", lines=6)
        status_out = gr.Textbox(label="Status", lines=1)

    # Wire the button: outputs map positionally to analyze_prompt's 4-tuple.
    analyze_btn.click(
        analyze_prompt,
        inputs=[prompt_input],
        outputs=[original_out, analysis_out, safer_out, status_out]
    )

# Launch the app when run as a script (Hugging Face Spaces entry point).
if __name__ == "__main__":
    demo.launch()