Spaces:

AmnaHassan
/

infoSecProject

Sleeping

App Files Files Community

AmnaHassan commited on Feb 2

Commit

ea4398d

verified ·

1 Parent(s): bfd5a34

Update app.py

Browse files

Files changed (1) hide show

app.py +133 -88

app.py CHANGED Viewed

@@ -2,11 +2,12 @@ import streamlit as st
 import torch
 import torch.nn as nn
 import numpy as np
 import joblib
 import plotly.graph_objects as go
 # -----------------------------
-# Page config (premium look)
 # -----------------------------
 st.set_page_config(
     page_title="Cyber Threat Detection Dashboard",
@@ -15,11 +16,24 @@ st.set_page_config(
 )
 # -----------------------------
-# Title Section
 # -----------------------------
 st.markdown("""
-# 🛡️ Cyber Threat Detection Dashboard
-**Deep Learning–Based Suspicious Activity Detection**
 """)
 st.markdown("---")
@@ -28,11 +42,10 @@ st.markdown("---")
 # Load scaler
 # -----------------------------
 scaler = joblib.load("scaler.pkl")
-INPUT_DIM = scaler.mean_.shape[0]
 # -----------------------------
-# Model definition
-# (MUST match training exactly)
 # -----------------------------
 model = nn.Sequential(
     nn.Linear(INPUT_DIM, 128),
@@ -48,88 +61,120 @@ model = nn.Sequential(
     nn.Linear(64, 1)
 )
-# -----------------------------
-# Load trained weights
-# -----------------------------
-state_dict = torch.load("model.pth", map_location="cpu")
-model.load_state_dict(state_dict)
 model.eval()
-# -----------------------------
-# Sidebar – Log Input
-# -----------------------------
-st.sidebar.header("🔍 Log Feature Input")
-features = []
-for i in range(INPUT_DIM):
-    val = st.sidebar.number_input(
-        f"Feature {i+1}",
-        value=0.0,
-        step=0.01
-    )
-    features.append(val)
-# -----------------------------
-# Prediction
-# -----------------------------
-if st.sidebar.button("🚨 Analyze Event"):
-    x = np.array(features).reshape(1, -1)
-    x_scaled = scaler.transform(x)
-    x_tensor = torch.tensor(x_scaled, dtype=torch.float32)
-    with torch.no_grad():
-        prob = torch.sigmoid(model(x_tensor)).item()
-    # -------------------------
-    # Risk level logic
-    # -------------------------
-    if prob > 0.7:
-        risk = "HIGH"
-        color = "red"
-        action = "Immediate investigation required. Isolate affected system."
-    elif prob > 0.4:
-        risk = "MEDIUM"
-        color = "orange"
-        action = "Monitor closely. Correlate with other logs."
-    else:
-        risk = "LOW"
-        color = "green"
-        action = "No action required. Log for auditing."
-    # -------------------------
-    # Main dashboard layout
-    # -------------------------
-    col1, col2, col3 = st.columns(3)
-    col1.metric("Risk Level", risk)
-    col2.metric("Suspicion Probability", f"{prob:.2f}")
-    col3.metric("Recommended Action", action)
-    # -------------------------
-    # Gauge chart
-    # -------------------------
-    fig = go.Figure(go.Indicator(
-        mode="gauge+number",
-        value=prob * 100,
-        title={'text': "Threat Confidence (%)"},
-        gauge={
-            'axis': {'range': [0, 100]},
-            'bar': {'color': color},
-            'steps': [
-                {'range': [0, 40], 'color': "lightgreen"},
-                {'range': [40, 70], 'color': "orange"},
-                {'range': [70, 100], 'color': "red"}
-            ],
-        }
-    ))
-    st.plotly_chart(fig, use_container_width=True)
-    # -------------------------
-    # Explanation block
-    # -------------------------
-    st.markdown("### 🧠 Model Interpretation")
-    st.info(
-        "The model analyzes behavioral patterns in system logs and assigns a risk score "
-        "based on learned representations of malicious activity from the BETH dataset."
     )

 import torch
 import torch.nn as nn
 import numpy as np
+import pandas as pd
 import joblib
 import plotly.graph_objects as go
 # -----------------------------
+# Page config
 # -----------------------------
 st.set_page_config(
     page_title="Cyber Threat Detection Dashboard",
 )
 # -----------------------------
+# Feature names (MUST match training order)
+# -----------------------------
+FEATURE_COLUMNS = [
+    "processId",
+    "threadId",
+    "parentProcessId",
+    "userId",
+    "mountNamespace",
+    "argsNum",
+    "returnValue"
+]
+# -----------------------------
+# Title
 # -----------------------------
 st.markdown("""
+# 🛡️ Cyber Threat Detection Dashboard
+**SOC-Style Deep Learning–Based Suspicious Activity Detection**
 """)
 st.markdown("---")
 # Load scaler
 # -----------------------------
 scaler = joblib.load("scaler.pkl")
+INPUT_DIM = len(FEATURE_COLUMNS)
 # -----------------------------
+# Model (EXACT training architecture)
 # -----------------------------
 model = nn.Sequential(
     nn.Linear(INPUT_DIM, 128),
     nn.Linear(64, 1)
 )
+model.load_state_dict(torch.load("model.pth", map_location="cpu"))
 model.eval()
+# =============================
+# SIDEBAR
+# =============================
+st.sidebar.header("🔍 Analysis Mode")
+mode = st.sidebar.radio(
+    "Choose input type",
+    ["Single Log Event", "Upload CSV (Batch Analysis)"]
+)
+# =============================
+# SINGLE EVENT MODE
+# =============================
+if mode == "Single Log Event":
+    st.sidebar.subheader("Log Features")
+    features = []
+    for col in FEATURE_COLUMNS:
+        val = st.sidebar.number_input(col, value=0)
+        features.append(val)
+    if st.sidebar.button("🚨 Analyze Event"):
+        x = np.array(features).reshape(1, -1)
+        x_scaled = scaler.transform(x)
+        x_tensor = torch.tensor(x_scaled, dtype=torch.float32)
+        with torch.no_grad():
+            prob = torch.sigmoid(model(x_tensor)).item()
+        # Risk logic
+        if prob > 0.7:
+            risk = "HIGH"
+            color = "red"
+            action = "Immediate investigation required. Isolate affected system."
+        elif prob > 0.4:
+            risk = "MEDIUM"
+            color = "orange"
+            action = "Monitor closely. Correlate with other logs."
+        else:
+            risk = "LOW"
+            color = "green"
+            action = "No action required. Log for auditing."
+        col1, col2, col3 = st.columns(3)
+        col1.metric("Risk Level", risk)
+        col2.metric("Suspicion Probability", f"{prob:.2f}")
+        col3.metric("Recommended Action", action)
+        fig = go.Figure(go.Indicator(
+            mode="gauge+number",
+            value=prob * 100,
+            title={'text': "Threat Confidence (%)"},
+            gauge={
+                'axis': {'range': [0, 100]},
+                'bar': {'color': color},
+                'steps': [
+                    {'range': [0, 40], 'color': "lightgreen"},
+                    {'range': [40, 70], 'color': "orange"},
+                    {'range': [70, 100], 'color': "red"}
+                ],
+            }
+        ))
+        st.plotly_chart(fig, use_container_width=True)
+# =============================
+# CSV UPLOAD MODE
+# =============================
+else:
+    st.subheader("📄 Batch Log Analysis")
+    uploaded_file = st.file_uploader(
+        "Upload CSV file (validation/test logs)",
+        type=["csv"]
     )
+    if uploaded_file:
+        df = pd.read_csv(uploaded_file)
+        # Drop label column if present
+        if "sus_label" in df.columns:
+            df = df.drop(columns=["sus_label"])
+        # Ensure correct columns
+        missing = set(FEATURE_COLUMNS) - set(df.columns)
+        if missing:
+            st.error(f"Missing required columns: {missing}")
+        else:
+            df = df[FEATURE_COLUMNS]  # enforce correct order
+            X_scaled = scaler.transform(df.values)
+            X_tensor = torch.tensor(X_scaled, dtype=torch.float32)
+            with torch.no_grad():
+                probs = torch.sigmoid(model(X_tensor)).numpy().flatten()
+            df["suspicion_probability"] = probs
+            df["risk_level"] = df["suspicion_probability"].apply(
+                lambda p: "HIGH" if p > 0.7 else "MEDIUM" if p > 0.4 else "LOW"
+            )
+            st.success("Batch analysis completed")
+            st.dataframe(df, use_container_width=True)
+            st.markdown("### 📊 Risk Distribution")
+            st.bar_chart(df["risk_level"].value_counts())
+# =============================
+# Footer
+# =============================
+st.markdown("---")
+st.info(
+    "This dashboard simulates a Security Operations Center (SOC) workflow by "
+    "analyzing system logs using a deep learning model trained on the BETH dataset."
+)