Spaces:

absence404
/

securebot

Running

App Files Files Community

absence404 committed 2 days ago

Commit

f21361a

verified ·

1 Parent(s): 50abaa4

Upload 4 files

Browse files

Files changed (4) hide show

Dockerfile +12 -0
backend/classifier.py +32 -0
backend/main.py +44 -0
requirements.txt +87 -0

Dockerfile ADDED Viewed

	@@ -0,0 +1,12 @@

+# Container image for the securebot FastAPI backend.
+FROM python:3.12-slim
+WORKDIR /app
+# Dependencies are installed before the source is copied, so this step
+# depends only on requirements.txt and not on the contents of backend/.
+COPY requirements.txt .
+RUN pip install --no-cache-dir -r requirements.txt
+COPY backend/ ./backend/
+# Port that the uvicorn command below listens on.
+EXPOSE 7860
+# Serve the `app` object from backend/main.py on all interfaces.
+CMD ["uvicorn", "backend.main:app", "--host", "0.0.0.0", "--port", "7860"]

backend/classifier.py ADDED Viewed

	@@ -0,0 +1,32 @@

+from transformers import pipeline
+# Text-classification pipeline used by detect_injection(). It is constructed
+# once, at import time, and the same object is reused for every call.
+classifier = pipeline(
+    "text-classification",
+    model="protectai/deberta-v3-base-prompt-injection-v2",
+    device=-1  # presumably selects CPU inference - confirm against the transformers docs
+)
+def detect_injection(user_input: str) -> dict:
+    result = classifier(user_input)[0]
+    label = result["label"]
+    score = result["score"]
+    suspicious_keywords = [
+        "ignore previous instructions",
+        "hack the system",
+        "disregard your system prompt",
+        "you are now",
+        "forget everything",
+        "act as",
+        "jailbreak"
+    ]
+    rule_triggered = any(kw in user_input.lower() for kw in suspicious_keywords)
+    is_malicious = (label == "INJECTION" and score > 0.85) or rule_triggered
+    return {
+        "input": user_input,
+        "label": label,
+        "confidence": round(score, 3),
+        "rule_triggered": rule_triggered,
+        "is_malicious": is_malicious
+    }

backend/main.py ADDED Viewed

	@@ -0,0 +1,44 @@

+from fastapi import FastAPI
+from fastapi.middleware.cors import CORSMiddleware
+from pydantic import BaseModel
+from classifier import detect_injection
+from groq import Groq
+from dotenv import load_dotenv
+import os
+load_dotenv(dotenv_path="../.env")
+app = FastAPI()
+app.add_middleware(
+    CORSMiddleware,
+    allow_origins=["*"],
+    allow_methods=["*"],
+    allow_headers=["*"],
+)
+client = Groq(api_key=os.getenv("GROQ_API_KEY"))
+class ChatRequest(BaseModel):
+    """JSON request body carrying a single chat message."""
+    message: str  # the user's message text
+@app.post("/chat")
+def chat(req: ChatRequest):
+    detection = detect_injection(req.message)
+    if detection["is_malicious"]:
+        return {
+            "response": "Prompt injection detected. Request blocked.",
+            "flagged": True,
+            "detection": detection
+        }
+    completion = client.chat.completions.create(
+        model="llama-3.3-70b-versatile",
+        messages=[
+            {"role": "system", "content": "You are a helpful customer support assistant. You help users with order issues, and general inquiries. You do not have access to internal systems or user account data.If you cannot help, politely direct the user to contact support@company.com. Your return policy is 30 days. The order is dispatched and should arrive in 2-5 days"},
+            {"role": "user", "content": req.message}
+        ]
+    )
+    return {
+        "response": completion.choices[0].message.content,
+        "flagged": False,
+        "detection": detection
+    }

requirements.txt ADDED Viewed

	@@ -0,0 +1,87 @@

+aiohappyeyeballs==2.6.1
+aiohttp==3.13.3
+aiosignal==1.4.0
+altair==6.0.0
+annotated-doc==0.0.4
+annotated-types==0.7.0
+anyio==4.12.1
+attrs==25.4.0
+blinker==1.9.0
+cachetools==6.2.6
+certifi==2026.2.25
+charset-normalizer==3.4.4
+click==8.3.1
+datasets==4.6.1
+dill==0.4.0
+distro==1.9.0
+fastapi==0.134.0
+filelock==3.24.3
+frozenlist==1.8.0
+fsspec==2026.2.0
+gitdb==4.0.12
+GitPython==3.1.46
+groq==1.0.0
+h11==0.16.0
+hf-xet==1.3.2
+httpcore==1.0.9
+httpx==0.28.1
+huggingface_hub==1.5.0
+idna==3.11
+Jinja2==3.1.6
+jiter==0.13.0
+jsonschema==4.26.0
+jsonschema-specifications==2025.9.1
+markdown-it-py==4.0.0
+MarkupSafe==3.0.3
+mdurl==0.1.2
+mpmath==1.3.0
+multidict==6.7.1
+multiprocess==0.70.18
+narwhals==2.17.0
+networkx==3.6.1
+numpy==2.4.2
+openai==2.24.0
+packaging==26.0
+pandas==2.3.3
+pillow==12.1.1
+propcache==0.4.1
+protobuf==6.33.5
+pyarrow==23.0.1
+pydantic==2.12.5
+pydantic_core==2.41.5
+pydeck==0.9.1
+Pygments==2.19.2
+python-dateutil==2.9.0.post0
+python-dotenv==1.2.1
+pytz==2025.2
+PyYAML==6.0.3
+referencing==0.37.0
+regex==2026.2.28
+requests==2.32.5
+rich==14.3.3
+rpds-py==0.30.0
+safetensors==0.7.0
+setuptools==82.0.0
+shellingham==1.5.4
+six==1.17.0
+smmap==5.0.2
+sniffio==1.3.1
+starlette==0.52.1
+streamlit==1.54.0
+sympy==1.14.0
+tenacity==9.1.4
+tokenizers==0.22.2
+toml==0.10.2
+torch==2.10.0
+tornado==6.5.4
+tqdm==4.67.3
+transformers==5.2.0
+typer==0.24.1
+typer-slim==0.24.0
+typing-inspection==0.4.2
+typing_extensions==4.15.0
+tzdata==2025.3
+urllib3==2.6.3
+uvicorn==0.41.0
+xxhash==3.6.0
+yarl==1.22.0