Spaces:

vibesecurityguy
/

veris-classifier

Running on Zero

App Files Files Community

veris-classifier / app.py

vibesecurityguy

Upload app.py with huggingface_hub

cac9d59 verified 22 days ago

raw

history blame contribute delete

48.4 kB

	"""VERIS Classifier - Gradio Web Application.

	Dual-mode inference:
	- Primary: Fine-tuned Mistral-7B-Instruct on ZeroGPU (no API key needed)
	- Fallback: OpenAI API (user provides their own key)
	"""

	# ── HfFolder compatibility shim ──────────────────────────────────────────
	# Gradio's oauth.py imports HfFolder from huggingface_hub, but HfFolder was
	# removed in huggingface_hub >= 0.24. This shim must run BEFORE importing
	# Gradio so the import chain doesn't break.
	try:
	    from huggingface_hub import HfFolder  # noqa: F401
	except ImportError:
	    import huggingface_hub

	    class _HfFolder:
	        """Stand-in for the `HfFolder` class that newer huggingface_hub lacks.

	        Only the two token helpers are provided; each one delegates to the
	        corresponding module-level function of `huggingface_hub`.
	        """

	        @classmethod
	        def get_token(cls):
	            """Return whatever `huggingface_hub.get_token()` returns."""
	            return huggingface_hub.get_token()

	        @classmethod
	        def save_token(cls, token):
	            """Hand `token` to `huggingface_hub.login`."""
	            huggingface_hub.login(token=token)

	    # Publish the stand-in under the old name so that a later
	    # `from huggingface_hub import HfFolder` resolves.
	    setattr(huggingface_hub, "HfFolder", _HfFolder)
	# ──────────────────────────────────────────────────────────────────────────

	import json
	import logging
	import os
	import csv
	import tempfile
	import time
	from importlib import metadata, util
	from typing import Any

	import gradio as gr
	from dotenv import load_dotenv

	from src.veris_classifier.classifier import (
	answer_question,
	classify_incident,
	)
	from src.veris_classifier.validator import validate_classification

	# Run python-dotenv's loader before any os.getenv() lookups below.
	load_dotenv()
	# Root logging at INFO; `logger` is the module-level logger used throughout this file.
	logging.basicConfig(level=logging.INFO)
	logger = logging.getLogger(__name__)

	# ---------------------------------------------------------------------------
	# ZeroGPU support — only available on HF Spaces
	# ---------------------------------------------------------------------------
	# True when the SPACE_ID environment variable is present.
	IS_SPACES = os.environ.get("SPACE_ID") is not None

	# Holds the module that provides the `GPU` decorator, or None if none was found.
	spaces = None
	if IS_SPACES:
	    try:
	        import spaces as _spaces

	        # Local `spaces/` directory can shadow the HF `spaces` package.
	        if not hasattr(_spaces, "GPU"):
	            raise ImportError("Imported `spaces` module has no GPU decorator")
	        spaces = _spaces
	    except Exception:
	        # Second attempt: bypass the normal import path and execute the
	        # installed distribution's `spaces/__init__.py` directly.
	        try:
	            dist = metadata.distribution("spaces")
	            module_path = dist.locate_file("spaces/__init__.py")
	            spec = util.spec_from_file_location("hf_spaces_runtime", module_path)
	            if spec is None or spec.loader is None:
	                raise ImportError("Could not load spaces package spec")
	            _spaces = util.module_from_spec(spec)
	            spec.loader.exec_module(_spaces)
	            if not hasattr(_spaces, "GPU"):
	                raise ImportError("Installed spaces package has no GPU decorator")
	            spaces = _spaces
	        except Exception as e:
	            # Best effort only: leave `spaces` as None and keep running.
	            logger.warning(
	                "HF Spaces GPU decorator unavailable (%s). Falling back to non-GPU wrappers.",
	                e,
	            )

	# ---------------------------------------------------------------------------
	# Custom CSS
	# ---------------------------------------------------------------------------
	# Stylesheet string handed to `gr.Blocks(css=...)` in build_app(). It styles the
	# hero header, stats bar, tabs, inputs, buttons, banners, about cards, footer and
	# status card, and has two responsive breakpoints (900px and 560px).
	CUSTOM_CSS = """
	/* Global */
	.gradio-container {
	max-width: 1200px !important;
	margin: 0 auto !important;
	font-family: 'Inter', -apple-system, BlinkMacSystemFont, sans-serif !important;
	}

	/* Hero header */
	.hero-section {
	background: linear-gradient(135deg, #0f172a 0%, #1e293b 50%, #0f172a 100%);
	border: 1px solid #334155;
	border-radius: 16px;
	padding: 40px 48px;
	margin-bottom: 24px;
	position: relative;
	overflow: hidden;
	}
	.hero-section::before {
	content: '';
	position: absolute;
	top: 0;
	left: 0;
	right: 0;
	bottom: 0;
	background: radial-gradient(ellipse at 20% 50%, rgba(59, 130, 246, 0.08) 0%, transparent 60%),
	radial-gradient(ellipse at 80% 50%, rgba(139, 92, 246, 0.06) 0%, transparent 60%);
	pointer-events: none;
	}
	.hero-title {
	font-size: 2.2rem !important;
	font-weight: 700 !important;
	color: #f1f5f9 !important;
	margin: 0 0 8px 0 !important;
	letter-spacing: -0.02em;
	}
	.hero-subtitle {
	font-size: 1.05rem !important;
	color: #94a3b8 !important;
	margin: 0 0 20px 0 !important;
	line-height: 1.6;
	}
	.hero-badges {
	display: flex;
	gap: 12px;
	flex-wrap: wrap;
	}
	.hero-badge {
	display: inline-flex;
	align-items: center;
	gap: 6px;
	background: rgba(255, 255, 255, 0.06);
	border: 1px solid rgba(255, 255, 255, 0.1);
	border-radius: 20px;
	padding: 6px 14px;
	font-size: 0.82rem;
	color: #cbd5e1;
	}

	/* Stats bar */
	.stats-row {
	display: flex;
	gap: 16px;
	margin-bottom: 20px;
	}
	.stat-card {
	flex: 1;
	background: #1e293b;
	border: 1px solid #334155;
	border-radius: 12px;
	padding: 20px 24px;
	text-align: center;
	}
	.stat-number {
	font-size: 1.8rem;
	font-weight: 700;
	color: #60a5fa;
	line-height: 1;
	margin-bottom: 4px;
	}
	.stat-label {
	font-size: 0.8rem;
	color: #94a3b8;
	text-transform: uppercase;
	letter-spacing: 0.05em;
	}

	/* Tabs */
	.tabs {
	border: none !important;
	}
	button.tab-nav {
	font-weight: 600 !important;
	font-size: 0.95rem !important;
	padding: 12px 24px !important;
	}

	/* Input areas */
	textarea {
	border-radius: 10px !important;
	border: 1px solid #334155 !important;
	font-size: 0.95rem !important;
	line-height: 1.6 !important;
	}
	textarea:focus {
	border-color: #3b82f6 !important;
	box-shadow: 0 0 0 3px rgba(59, 130, 246, 0.15) !important;
	}

	/* Buttons */
	.primary-btn {
	border-radius: 10px !important;
	font-weight: 600 !important;
	font-size: 0.95rem !important;
	padding: 12px 32px !important;
	background: linear-gradient(135deg, #3b82f6 0%, #2563eb 100%) !important;
	border: none !important;
	transition: all 0.2s ease !important;
	}
	.primary-btn:hover {
	transform: translateY(-1px) !important;
	box-shadow: 0 4px 12px rgba(59, 130, 246, 0.3) !important;
	}

	/* Code output */
	.code-output {
	border-radius: 12px !important;
	border: 1px solid #334155 !important;
	}

	/* Examples */
	.examples-table {
	border-radius: 10px !important;
	overflow: hidden;
	}

	/* Model info banner */
	.model-banner {
	background: linear-gradient(135deg, rgba(52, 211, 153, 0.1) 0%, rgba(59, 130, 246, 0.1) 100%);
	border: 1px solid rgba(52, 211, 153, 0.3);
	border-radius: 12px;
	padding: 14px 20px;
	margin-bottom: 20px;
	display: flex;
	align-items: center;
	gap: 10px;
	font-size: 0.9rem;
	color: #94a3b8;
	}
	.model-banner strong {
	color: #34d399;
	}
	.model-banner .fallback {
	color: #fbbf24;
	}

	/* Section headers */
	.section-header {
	font-size: 1.1rem !important;
	font-weight: 600 !important;
	color: #e2e8f0 !important;
	margin-bottom: 8px !important;
	}
	.section-desc {
	font-size: 0.9rem !important;
	color: #94a3b8 !important;
	margin-bottom: 16px !important;
	}

	/* About page cards */
	.about-card {
	background: #1e293b;
	border: 1px solid #334155;
	border-radius: 12px;
	padding: 24px;
	margin-bottom: 16px;
	}

	/* Footer */
	.footer {
	text-align: center;
	padding: 24px;
	margin-top: 32px;
	border-top: 1px solid #1e293b;
	color: #64748b;
	font-size: 0.85rem;
	}
	.footer a {
	color: #60a5fa;
	text-decoration: none;
	}

	.status-card {
	border: 1px solid #334155;
	background: rgba(15, 23, 42, 0.6);
	border-radius: 10px;
	padding: 8px 12px;
	}

	#table-controls .wrap {
	align-items: end;
	}

	/* Mobile */
	@media (max-width: 900px) {
	.hero-section {
	padding: 28px 20px;
	}
	.hero-title {
	font-size: 1.75rem !important;
	}
	.stats-row {
	flex-wrap: wrap;
	}
	.stat-card {
	min-width: calc(50% - 8px);
	}
	}

	@media (max-width: 560px) {
	.stat-card {
	min-width: 100%;
	}
	.hero-badges {
	gap: 8px;
	}
	.primary-btn {
	width: 100% !important;
	}
	#table-controls .wrap {
	gap: 8px !important;
	}
	}
	"""

	# ---------------------------------------------------------------------------
	# Examples
	# ---------------------------------------------------------------------------
	# Sample incident narratives passed to `gr.Examples` for the incident-description
	# textbox in build_app(). Each entry is a one-element list.
	EXAMPLES_CLASSIFY = [
	["A hospital employee lost their unencrypted laptop containing patient records while traveling. The device was left in a taxi and never recovered."],
	["Russian organized crime group used stolen credentials to access the company's web application and exfiltrated 50,000 customer credit card numbers over several weeks."],
	["An employee emailed a spreadsheet containing salary information for all staff to their personal Gmail account, violating company data handling policy."],
	["Attackers sent phishing emails to the finance department. One employee clicked the link and entered credentials on a fake login page. The attackers then used those credentials to initiate wire transfers totaling $2.3 million."],
	["A ransomware attack encrypted all file servers after an employee opened a malicious email attachment. The company was unable to access critical systems for 5 days."],
	["During a routine office move, several boxes of paper documents containing customer Social Security numbers were accidentally left at the old building and found by the new tenant."],
	]

	# Sample questions passed to `gr.Examples` for the question textbox in build_app().
	# Same one-element-list shape as above.
	EXAMPLES_QA = [
	["What is the difference between hacking and misuse in VERIS?"],
	["How do I classify a phishing attack that led to ransomware?"],
	["What are the three actor types in VERIS?"],
	["When should I mark data_disclosure as 'Potentially' vs 'Yes'?"],
	["What is the A4 Grid and how is it used?"],
	["How does VERIS handle incidents with multiple threat actors?"],
	]


	# ---------------------------------------------------------------------------
	# Inference functions
	# ---------------------------------------------------------------------------
	# Substring searched for in an exception's text by _is_zerogpu_queue_timeout().
	ZEROGPU_QUEUE_HINT = "No GPU was available after"
	# Space page URL embedded in the "please log in" error messages of classify()/ask().
	SPACES_PAGE_URL = "https://huggingface.co/spaces/vibesecurityguy/veris-classifier"
	# Host URL used to build the direct "/login/huggingface" sign-in link in build_app().
	SPACE_HOST_URL = "https://vibesecurityguy-veris-classifier.hf.space"
	# Upper bound on the loop in _run_with_zerogpu_retry() (total tries, not extra retries).
	ZEROGPU_RETRY_ATTEMPTS = 2
	# Seconds slept between tries in _run_with_zerogpu_retry().
	ZEROGPU_RETRY_DELAY_SECONDS = 3


	def _is_zerogpu_queue_timeout(err: Exception) -> bool:
	    """Report whether `err`'s text contains the ZeroGPU queue-timeout marker.

	    The check is a plain substring search for `ZEROGPU_QUEUE_HINT` in
	    `str(err)`; the exception type is not inspected.
	    """
	    message = str(err)
	    return ZEROGPU_QUEUE_HINT in message


	def _spaces_user_logged_in(
	    request: gr.Request | None,
	    profile: gr.OAuthProfile | None = None,
	) -> bool:
	    """Decide whether an authenticated user is attached to this call.

	    The signals are checked in order and the first hit wins:

	    1. an OAuth `profile` object was supplied;
	    2. `request.username` is truthy;
	    3. `request.session` is a dict with a truthy ``"oauth_info"`` entry.

	    Args:
	        request: The current request, or None when no request is available.
	        profile: The OAuth profile, or None.

	    Returns:
	        True if any signal indicates a logged-in user, otherwise False.
	    """
	    if profile is not None:
	        return True
	    if request is None:
	        return False
	    if getattr(request, "username", None):
	        return True
	    # Fallback signal: OAuth info kept in the session mapping.
	    session = getattr(request, "session", None)
	    return isinstance(session, dict) and bool(session.get("oauth_info"))


	def _session_status_markdown(
	    request: gr.Request | None = None,
	    profile: gr.OAuthProfile | None = None,
	) -> str:
	    """Build the one-line session status message for the UI.

	    Args:
	        request: The current request, or None.
	        profile: The OAuth profile, or None.

	    Returns:
	        An empty string when `IS_SPACES` is false. Otherwise a message that
	        says the user is not logged in, is logged in as a named user, or is
	        logged in without a known name.
	    """
	    if not IS_SPACES:
	        return ""

	    if not _spaces_user_logged_in(request, profile):
	        return (
	            "Session status: Not logged in. Click sign in to attach this browser session "
	            "to your Hugging Face quota."
	        )

	    # Prefer the profile's names; fall back to the request's username.
	    username = None
	    if profile is not None:
	        username = (
	            getattr(profile, "preferred_username", None)
	            or getattr(profile, "name", None)
	        )
	    if not username and request is not None:
	        username = getattr(request, "username", None)

	    if username:
	        return (
	            f"Session status: Logged in as `{username}`. "
	            "ZeroGPU requests will use your account quota."
	        )
	    return "Session status: Logged in. ZeroGPU requests will use your account quota."


	def _run_with_zerogpu_retry(call):
	"""Retry queue-timeout failures once before returning an error."""
	last_error = None
	for attempt in range(1, ZEROGPU_RETRY_ATTEMPTS + 1):
	try:
	return call()
	except Exception as e:
	last_error = e
	if _is_zerogpu_queue_timeout(e) and attempt < ZEROGPU_RETRY_ATTEMPTS:
	logger.warning(
	"ZeroGPU queue timeout (attempt %d/%d). Retrying in %ss.",
	attempt,
	ZEROGPU_RETRY_ATTEMPTS,
	ZEROGPU_RETRY_DELAY_SECONDS,
	)
	time.sleep(ZEROGPU_RETRY_DELAY_SECONDS)
	continue
	raise
	raise last_error



	def _use_hf_model() -> bool:
	    """Tell whether inference should go through the fine-tuned HF model.

	    Always True when `IS_SPACES` is set. Otherwise True only if the
	    `VERIS_USE_HF` environment variable is "1", "true" or "yes"
	    (case-insensitive).
	    """
	    opted_in = os.getenv("VERIS_USE_HF", "").lower() in ("1", "true", "yes")
	    return True if IS_SPACES else opted_in


	def classify(
	    description: str,
	    api_key: str,
	    request: gr.Request | None = None,
	    profile: gr.OAuthProfile | None = None,
	) -> str:
	    """Classify an incident description and return the result as a JSON string.

	    The HF model path is used when `_use_hf_model()` says so, unless a
	    non-empty `api_key` is given while running outside Spaces. If the HF path
	    fails outside Spaces and `OPENAI_API_KEY` is set, the OpenAI path is tried.

	    Args:
	        description: Free-text incident description. None counts as empty.
	        api_key: OpenAI API key typed by the user. None counts as empty.
	        request: Current request, used only for the login check.
	        profile: OAuth profile, used only for the login check.

	    Returns:
	        Pretty-printed JSON: either the classification, or an object with a
	        single ``"error"`` key. This function does not raise for inference
	        failures; they are reported through that key.
	    """
	    description = description or ""
	    api_key = (api_key or "").strip()

	    if not description.strip():
	        return json.dumps({"error": "Please enter an incident description."}, indent=2)
	    if IS_SPACES and not _spaces_user_logged_in(request, profile):
	        return json.dumps(
	            {
	                "error": (
	                    "Please log in on Hugging Face and open this app from "
	                    f"{SPACES_PAGE_URL}. ZeroGPU quota is per logged-in user."
	                )
	            },
	            indent=2,
	        )

	    use_hf = _use_hf_model()

	    # Local-only override: allow OpenAI fallback when running outside Spaces.
	    if api_key and not IS_SPACES:
	        use_hf = False

	    if use_hf:
	        try:
	            result = _run_with_zerogpu_retry(lambda: _classify_gpu(description))
	            return json.dumps(result, indent=2)
	        except Exception as e:
	            # logger.exception keeps the traceback in the log.
	            logger.exception("HF model error: %s", e)
	            if _is_zerogpu_queue_timeout(e):
	                return json.dumps(
	                    {"error": "ZeroGPU queue is full right now. Try again in 1-2 minutes."},
	                    indent=2,
	                )
	            if IS_SPACES:
	                return json.dumps({"error": f"Model inference failed: {str(e)}"}, indent=2)
	            # Local fallback path only.
	            key = os.getenv("OPENAI_API_KEY", "")
	            if not key:
	                return json.dumps({"error": f"Model inference failed: {str(e)}"}, indent=2)
	    else:
	        key = api_key or os.getenv("OPENAI_API_KEY", "")
	        if not key:
	            return json.dumps(
	                {"error": "Please provide an OpenAI API key or wait for the model to load."},
	                indent=2,
	            )

	    # OpenAI fallback
	    try:
	        from openai import OpenAI

	        client = OpenAI(api_key=key)
	        result = classify_incident(client=client, description=description)
	        return json.dumps(result, indent=2)
	    except Exception as e:
	        return json.dumps({"error": str(e)}, indent=2)


	def ask(
	    question: str,
	    api_key: str,
	    request: gr.Request | None = None,
	    profile: gr.OAuthProfile | None = None,
	) -> str:
	    """Answer a VERIS question and return the answer text.

	    Path selection matches `classify`: the HF model is used when
	    `_use_hf_model()` says so, unless a non-empty `api_key` is given outside
	    Spaces. If the HF path fails outside Spaces and `OPENAI_API_KEY` is set,
	    the OpenAI path is tried.

	    Args:
	        question: The user's question. None counts as empty.
	        api_key: OpenAI API key typed by the user. None counts as empty.
	        request: Current request, used only for the login check.
	        profile: OAuth profile, used only for the login check.

	    Returns:
	        The answer, or a human-readable message describing what went wrong.
	        Inference failures are returned as text rather than raised.
	    """
	    question = question or ""
	    api_key = (api_key or "").strip()

	    if not question.strip():
	        return "Please enter a question."
	    if IS_SPACES and not _spaces_user_logged_in(request, profile):
	        return (
	            "Error: Please log in on Hugging Face and open this app from "
	            f"{SPACES_PAGE_URL}. ZeroGPU quota is per logged-in user."
	        )

	    use_hf = _use_hf_model()

	    # Local-only override: allow OpenAI fallback when running outside Spaces.
	    if api_key and not IS_SPACES:
	        use_hf = False

	    if use_hf:
	        try:
	            return _run_with_zerogpu_retry(lambda: _ask_gpu(question))
	        except Exception as e:
	            # logger.exception keeps the traceback in the log.
	            logger.exception("HF model error: %s", e)
	            if _is_zerogpu_queue_timeout(e):
	                return "Error: ZeroGPU queue is full right now. Try again in 1-2 minutes."
	            if IS_SPACES:
	                return f"Error: Model inference failed: {str(e)}"
	            # Local fallback path only.
	            key = os.getenv("OPENAI_API_KEY", "")
	            if not key:
	                return f"Error: Model inference failed: {str(e)}"
	    else:
	        key = api_key or os.getenv("OPENAI_API_KEY", "")
	        if not key:
	            return "Please provide an OpenAI API key or wait for the model to load."

	    # OpenAI fallback
	    try:
	        from openai import OpenAI

	        client = OpenAI(api_key=key)
	        return answer_question(client=client, question=question)
	    except Exception as e:
	        return f"Error: {str(e)}"


	def _dimension_from_path(path: str) -> str:
	root = path.split(".", 1)[0].split("[", 1)[0]
	return root.title() if root else "General"


	def _flatten_for_table(value: Any, path: str, rows: list[list[str]]) -> None:
	"""Flatten nested VERIS JSON into table rows."""
	if isinstance(value, dict):
	if not value:
	rows.append([_dimension_from_path(path), path or "root", "{}"])
	return
	for key, subvalue in value.items():
	subpath = f"{path}.{key}" if path else key
	_flatten_for_table(subvalue, subpath, rows)
	return

	if isinstance(value, list):
	if not value:
	rows.append([_dimension_from_path(path), path or "root", "[]"])
	return
	# Keep scalar lists compact in one row.
	if all(not isinstance(item, (dict, list)) for item in value):
	rows.append([_dimension_from_path(path), path or "root", ", ".join(map(str, value))])
	return
	for i, subvalue in enumerate(value):
	_flatten_for_table(subvalue, f"{path}[{i}]", rows)
	return

	rows.append([_dimension_from_path(path), path or "root", str(value)])


	def _classification_rows_from_json(raw_json: str) -> list[list[str]]:
	"""Build table rows from classifier JSON output string."""
	if not raw_json.strip():
	return []
	try:
	parsed = json.loads(raw_json)
	except Exception:
	return [["Error", "raw_output", raw_json]]

	rows: list[list[str]] = []
	_flatten_for_table(parsed, "", rows)
	return rows


	def _validation_summary_markdown(raw_json: str) -> str:
	"""Build validation summary for the classification output."""
	try:
	parsed = json.loads(raw_json)
	except Exception:
	return ""

	if not isinstance(parsed, dict) or parsed.get("error"):
	return "Validation: Skipped."

	result = validate_classification(parsed)
	lines = [f"Validation: {'Passed' if result.valid else 'Issues found'}"]
	if result.errors:
	lines.append("Errors")
	lines.extend(f"- {err}" for err in result.errors[:8])
	if len(result.errors) > 8:
	lines.append(f"- ... {len(result.errors) - 8} more")
	if result.warnings:
	lines.append("Warnings")
	lines.extend(f"- {warn}" for warn in result.warnings[:8])
	if len(result.warnings) > 8:
	lines.append(f"- ... {len(result.warnings) - 8} more")
	return "\n".join(lines)


	def _filter_classification_rows(
	rows: list[list[str]],
	dimension_filter: str,
	errors_only: bool,
	) -> list[list[str]]:
	"""Filter table rows by dimension and optionally error-only rows."""
	filtered: list[list[str]] = []
	for row in rows:
	if len(row) != 3:
	continue
	dimension, field, value = row

	if dimension_filter != "All" and dimension != dimension_filter:
	continue

	if errors_only:
	blob = f"{dimension} {field} {value}".lower()
	if "error" not in blob:
	continue

	filtered.append(row)
	return filtered


	def _render_classification_output(
	    raw_json: str,
	    output_format: str,
	    all_rows: list[list[str]],
	    dimension_filter: str,
	    errors_only: bool,
	):
	    """Produce the four component updates that switch between JSON and table view.

	    Returns a 4-tuple of `gr.update(...)` values, in this order: code view,
	    table, table-controls row, export button. In "Table" format the table
	    shows the filtered rows and the export button is enabled only when there
	    are rows to export. In any other format only the code view is visible.
	    """
	    visible_rows = _filter_classification_rows(all_rows, dimension_filter, errors_only)

	    if output_format != "Table":
	        return (
	            gr.update(value=raw_json, visible=True),
	            gr.update(value=[], visible=False),
	            gr.update(visible=False),
	            gr.update(visible=False, interactive=False),
	        )

	    has_rows = bool(visible_rows)
	    return (
	        gr.update(value=raw_json, visible=False),
	        gr.update(value=visible_rows, visible=True),
	        gr.update(visible=True),
	        gr.update(visible=True, interactive=has_rows),
	    )


	def _apply_table_filters(
	    all_rows: list[list[str]],
	    dimension_filter: str,
	    errors_only: bool,
	):
	    """Re-filter the stored rows and refresh the table and export button.

	    Returns a 2-tuple of `gr.update(...)` values: the table's new rows, and
	    the export button's `interactive` flag (on only when rows remain).
	    """
	    visible_rows = _filter_classification_rows(all_rows, dimension_filter, errors_only)
	    table_update = gr.update(value=visible_rows)
	    button_update = gr.update(interactive=bool(visible_rows))
	    return table_update, button_update


	def _build_filtered_csv(
	    all_rows: list[list[str]],
	    dimension_filter: str,
	    errors_only: bool,
	):
	    """Write the currently filtered rows to a temporary CSV for download.

	    Returns a `gr.update(...)` for the file component. It is hidden with no
	    value when no rows match; otherwise it is visible and points at a new
	    UTF-8 ".csv" file with a "Dimension, Field, Value" header row. The file is
	    created with `delete=False`, so it persists after this function returns.
	    """
	    visible_rows = _filter_classification_rows(all_rows, dimension_filter, errors_only)
	    if not visible_rows:
	        return gr.update(value=None, visible=False)

	    handle = tempfile.NamedTemporaryFile(
	        mode="w",
	        suffix=".csv",
	        delete=False,
	        newline="",
	        encoding="utf-8",
	    )
	    with handle as out:
	        sheet = csv.writer(out)
	        sheet.writerow(["Dimension", "Field", "Value"])
	        sheet.writerows(visible_rows)
	        saved_path = out.name

	    return gr.update(value=saved_path, visible=True)


	def classify_and_render(
	    description: str,
	    api_key: str,
	    output_format: str,
	    dimension_filter: str,
	    errors_only: bool,
	    request: gr.Request | None = None,
	    profile: gr.OAuthProfile | None = None,
	):
	    """Run one classification and build every output the Classify tab needs.

	    Args:
	        description: Incident text to classify.
	        api_key: OpenAI API key passed through to `classify`.
	        output_format: "Table" selects the table view; anything else the JSON view.
	        dimension_filter: Dimension filter applied to the table rows.
	        errors_only: Whether the table is limited to rows mentioning "error".
	        request: Current request, forwarded to `classify`.
	        profile: OAuth profile, forwarded to `classify`.

	    Returns:
	        An 8-tuple: raw JSON string, all flattened rows, validation markdown,
	        then updates for the code view, the table, the table-controls row and
	        the export button, and finally an update that clears and hides the
	        CSV file component.
	    """
	    raw_json = classify(description, api_key, request=request, profile=profile)
	    all_rows = _classification_rows_from_json(raw_json)
	    validation_md = _validation_summary_markdown(raw_json)
	    code_update, table_update, controls_update, export_btn_update = (
	        _render_classification_output(
	            raw_json,
	            output_format,
	            all_rows,
	            dimension_filter,
	            errors_only,
	        )
	    )
	    # A CSV generated for an earlier result no longer matches; hide it.
	    csv_reset = gr.update(value=None, visible=False)
	    return (
	        raw_json,
	        all_rows,
	        validation_md,
	        code_update,
	        table_update,
	        controls_update,
	        export_btn_update,
	        csv_reset,
	    )


	# ---------------------------------------------------------------------------
	# GPU-decorated functions for ZeroGPU
	# ---------------------------------------------------------------------------

	def _gpu_wrapper(duration: int):
	    """Return a decorator: `spaces.GPU(duration=...)` if usable, else a no-op.

	    The real decorator is used only when `IS_SPACES` is set and the module-level
	    `spaces` object exists and has a `GPU` attribute. In every other case the
	    returned decorator hands the function back unchanged.
	    """
	    gpu_ready = IS_SPACES and spaces is not None and hasattr(spaces, "GPU")
	    if gpu_ready:
	        return spaces.GPU(duration=duration)
	    return lambda fn: fn


	# `_gpu_wrapper` already returns a pass-through decorator when the ZeroGPU
	# decorator is unavailable (including outside Spaces), so a single pair of
	# definitions covers both the Spaces and the local case.
	@_gpu_wrapper(duration=120)
	def _classify_gpu(description: str) -> dict:
	    """Classify an incident with the fine-tuned model.

	    Calls `classify_incident(description=..., use_hf=True)` and returns its
	    result unchanged.
	    """
	    return classify_incident(description=description, use_hf=True)


	@_gpu_wrapper(duration=120)
	def _ask_gpu(question: str) -> str:
	    """Answer a question with the fine-tuned model.

	    Calls `answer_question(question=..., use_hf=True)` and returns its result
	    unchanged.
	    """
	    return answer_question(question=question, use_hf=True)


	# ---------------------------------------------------------------------------
	# App
	# ---------------------------------------------------------------------------
	# Gradio theme passed to `gr.Blocks(theme=...)` in build_app(). Built on
	# `gr.themes.Base` with blue/slate hues and the "Inter" Google font. Every
	# colour override is set to the same value for its `*_dark` twin.
	THEME = gr.themes.Base(
	primary_hue=gr.themes.colors.blue,
	secondary_hue=gr.themes.colors.slate,
	neutral_hue=gr.themes.colors.slate,
	font=gr.themes.GoogleFont("Inter"),
	).set(
	body_background_fill="#0f172a",
	body_background_fill_dark="#0f172a",
	block_background_fill="#1e293b",
	block_background_fill_dark="#1e293b",
	block_border_color="#334155",
	block_border_color_dark="#334155",
	block_label_text_color="#e2e8f0",
	block_label_text_color_dark="#e2e8f0",
	block_title_text_color="#f1f5f9",
	block_title_text_color_dark="#f1f5f9",
	body_text_color="#e2e8f0",
	body_text_color_dark="#e2e8f0",
	body_text_color_subdued="#94a3b8",
	body_text_color_subdued_dark="#94a3b8",
	input_background_fill="#0f172a",
	input_background_fill_dark="#0f172a",
	input_border_color="#334155",
	input_border_color_dark="#334155",
	input_placeholder_color="#64748b",
	input_placeholder_color_dark="#64748b",
	border_color_primary="#3b82f6",
	border_color_primary_dark="#3b82f6",
	button_primary_background_fill="linear-gradient(135deg, #3b82f6 0%, #2563eb 100%)",
	button_primary_background_fill_dark="linear-gradient(135deg, #3b82f6 0%, #2563eb 100%)",
	button_primary_text_color="#ffffff",
	button_primary_text_color_dark="#ffffff",
	shadow_spread="0px",
	)


	def build_app() -> gr.Blocks:
	with gr.Blocks(
	title="VERIS Incident Classifier",
	theme=THEME,
	css=CUSTOM_CSS,
	) as app:
	session_status = None

	# --- Hero Header ---
	gr.HTML("""
	<div class="hero-section">
	<div style="position: relative; z-index: 1;">
	<div class="hero-title">VERIS Incident Classifier</div>
	<div class="hero-subtitle">
	Transform security incident reports into structured
	<a href="https://verisframework.org/" target="_blank" style="color: #60a5fa; text-decoration: none;">VERIS</a>
	classifications using a fine-tuned AI model. No API key required.
	</div>
	<div class="hero-badges">
	<span class="hero-badge">
	<svg width="14" height="14" viewBox="0 0 24 24" fill="none" stroke="#60a5fa" stroke-width="2"><path d="M12 2L2 7l10 5 10-5-10-5zM2 17l10 5 10-5M2 12l10 5 10-5"/></svg>
	Fine-tuned Mistral-7B
	</span>
	<span class="hero-badge">
	<svg width="14" height="14" viewBox="0 0 24 24" fill="none" stroke="#a78bfa" stroke-width="2"><circle cx="12" cy="12" r="10"/><path d="M12 6v6l4 2"/></svg>
	10,000+ Real Incidents
	</span>
	<span class="hero-badge">
	<svg width="14" height="14" viewBox="0 0 24 24" fill="none" stroke="#34d399" stroke-width="2"><path d="M9 12l2 2 4-4m6 2a9 9 0 11-18 0 9 9 0 0118 0z"/></svg>
	VCDB + QLoRA
	</span>
	</div>
	</div>
	</div>
	""")

	# --- Stats Bar ---
	gr.HTML("""
	<div class="stats-row">
	<div class="stat-card">
	<div class="stat-number">4</div>
	<div class="stat-label">Dimensions</div>
	</div>
	<div class="stat-card">
	<div class="stat-number">315</div>
	<div class="stat-label">A4 Grid Combos</div>
	</div>
	<div class="stat-card">
	<div class="stat-number">10K+</div>
	<div class="stat-label">Trained Incidents</div>
	</div>
	<div class="stat-card">
	<div class="stat-number">300+</div>
	<div class="stat-label">Enum Values</div>
	</div>
	</div>
	""")

	# --- Model Info Banner ---
	if IS_SPACES:
	gr.HTML("""
	<div class="model-banner">
	<svg width="18" height="18" viewBox="0 0 24 24" fill="none" stroke="#34d399" stroke-width="2">
	<path d="M22 11.08V12a10 10 0 1 1-5.93-9.14"/>
	<polyline points="22 4 12 14.01 9 11.01"/>
	</svg>
	<span>
	<strong>Model:</strong> Fine-tuned
	<a href="https://huggingface.co/vibesecurityguy/veris-classifier-v2" target="_blank" style="color: #34d399;">Mistral-7B-Instruct</a>
	on ZeroGPU — no API key needed!
	</span>
	</div>
	""")
	with gr.Row():
	gr.Markdown(
	"Required: Log in with Hugging Face so ZeroGPU usage "
	"counts against your account quota."
	)
	login_btn = gr.LoginButton("Sign in with Hugging Face")
	# Gradio 4.44 can miss auto-activation in some Spaces contexts.
	login_btn.activate()
	gr.HTML(
	f'<a href="{SPACE_HOST_URL}/login/huggingface" target="_top" '
	'style="display:inline-block;padding:10px 14px;border-radius:8px;'
	'border:1px solid #334155;color:#cbd5e1;text-decoration:none;font-weight:600;">'
	"Direct sign-in (if button refreshes)</a>"
	)
	session_status = gr.Markdown(
	value="Session status: Checking...",
	elem_classes=["status-card"],
	)
	else:
	gr.HTML("""
	<div class="model-banner">
	<svg width="18" height="18" viewBox="0 0 24 24" fill="none" stroke="#fbbf24" stroke-width="2">
	<circle cx="12" cy="12" r="10"/>
	<line x1="12" y1="8" x2="12" y2="12"/>
	<line x1="12" y1="16" x2="12.01" y2="16"/>
	</svg>
	<span class="fallback">
	<strong>Local Mode:</strong> Set <code>VERIS_USE_HF=true</code> to use the
	fine-tuned model locally (requires GPU), or provide an OpenAI API key below.
	</span>
	</div>
	""")

	# --- API Key (local mode only) ---
	if IS_SPACES:
	api_key = gr.State("")
	else:
	with gr.Group():
	api_key = gr.Textbox(
	label="OpenAI API Key",
	placeholder="sk-... (required for OpenAI fallback)",
	type="password",
	info="Your key is never stored.",
	)

	# --- Main Tabs ---
	with gr.Tabs():

	# ---- TAB 1: Classify ----
	with gr.TabItem("Classify Incident", id="classify"):
	gr.HTML('<div class="section-header">Incident Classification</div>')
	gr.HTML('<div class="section-desc">Describe a security incident in plain English. The classifier will map it to the VERIS taxonomy across actors, actions, assets, and attributes.</div>')

	with gr.Row(equal_height=True):
	with gr.Column(scale=1):
	incident_input = gr.Textbox(
	label="Incident Description",
	placeholder="e.g., An attacker used stolen credentials to log into our web portal and download customer records containing names, emails, and credit card numbers...",
	lines=8,
	max_lines=15,
	)
	classify_btn = gr.Button(
	"Classify Incident",
	variant="primary",
	size="lg",
	elem_classes=["primary-btn"],
	)

	with gr.Column(scale=1):
	output_format = gr.Radio(
	choices=["JSON", "Table"],
	value="JSON",
	label="Output Format",
	info="Switch between raw JSON and a flattened table view.",
	)
	last_classification_raw = gr.State("")
	classification_rows = gr.State([])
	validation_output = gr.Markdown(
	label="Validation",
	value="Validation summary will appear after classification.",
	)
	classification_output = gr.Code(
	label="VERIS Classification (JSON)",
	language="json",
	lines=20,
	elem_classes=["code-output"],
	)
	with gr.Row(visible=False, elem_id="table-controls") as table_controls:
	dimension_filter = gr.Dropdown(
	choices=["All", "Actor", "Action", "Asset", "Attribute", "Error", "General"],
	value="All",
	label="Filter Dimension",
	)
	errors_only = gr.Checkbox(
	value=False,
	label="Errors Only",
	)
	export_csv_btn = gr.Button(
	"Generate CSV",
	size="sm",
	interactive=False,
	visible=False,
	)
	csv_file = gr.File(
	label="Download Filtered CSV",
	visible=False,
	interactive=False,
	)
	classification_table = gr.Dataframe(
	headers=["Dimension", "Field", "Value"],
	datatype=["str", "str", "str"],
	row_count=(0, "dynamic"),
	col_count=(3, "fixed"),
	visible=False,
	interactive=False,
	wrap=True,
	max_height=500,
	label="VERIS Classification (Table)",
	)

	gr.HTML('<div style="margin-top: 20px;"><div class="section-header">Try an Example</div></div>')
	gr.Examples(
	examples=EXAMPLES_CLASSIFY,
	inputs=incident_input,
	label="",
	examples_per_page=6,
	)

	classify_btn.click(
	fn=classify_and_render,
	inputs=[incident_input, api_key, output_format, dimension_filter, errors_only],
	outputs=[
	last_classification_raw,
	classification_rows,
	validation_output,
	classification_output,
	classification_table,
	table_controls,
	export_csv_btn,
	csv_file,
	],
	)
	output_format.change(
	fn=_render_classification_output,
	inputs=[
	last_classification_raw,
	output_format,
	classification_rows,
	dimension_filter,
	errors_only,
	],
	outputs=[classification_output, classification_table, table_controls, export_csv_btn],
	)
	dimension_filter.change(
	fn=_apply_table_filters,
	inputs=[classification_rows, dimension_filter, errors_only],
	outputs=[classification_table, export_csv_btn],
	)
	errors_only.change(
	fn=_apply_table_filters,
	inputs=[classification_rows, dimension_filter, errors_only],
	outputs=[classification_table, export_csv_btn],
	)
	export_csv_btn.click(
	fn=_build_filtered_csv,
	inputs=[classification_rows, dimension_filter, errors_only],
	outputs=[csv_file],
	)

	# ---- TAB 2: Q&A ----
	with gr.TabItem("Ask About VERIS", id="qa"):
	gr.HTML('<div class="section-header">VERIS Knowledge Base</div>')
	gr.HTML('<div class="section-desc">Ask anything about the VERIS framework — taxonomy, enumerations, classification guidance, the A4 Grid, or how specific incident types should be categorized.</div>')

	with gr.Row(equal_height=True):
	with gr.Column(scale=1):
	question_input = gr.Textbox(
	label="Your Question",
	placeholder="e.g., What's the difference between hacking and misuse in VERIS?",
	lines=4,
	max_lines=8,
	)
	ask_btn = gr.Button(
	"Ask Question",
	variant="primary",
	size="lg",
	elem_classes=["primary-btn"],
	)

	with gr.Column(scale=1):
	answer_output = gr.Markdown(
	label="Answer",
	value="Your answer will appear here...",
	)

	gr.HTML('<div style="margin-top: 20px;"><div class="section-header">Common Questions</div></div>')
	gr.Examples(
	examples=EXAMPLES_QA,
	inputs=question_input,
	label="",
	examples_per_page=6,
	)

	ask_btn.click(
	fn=ask,
	inputs=[question_input, api_key],
	outputs=answer_output,
	)

	# ---- TAB 3: About ----
	with gr.TabItem("About", id="about"):
	gr.HTML("""
	<div class="about-card">
	<h3 style="color: #f1f5f9; margin-top: 0;">What is VERIS?</h3>
	<p style="color: #94a3b8; line-height: 1.7;">
	<strong style="color: #e2e8f0;">VERIS</strong> (Vocabulary for Event Recording and Incident Sharing)
	is a structured taxonomy for describing security incidents, developed by the Verizon RISK Team.
	It powers the annual <a href="https://www.verizon.com/business/resources/reports/dbir/" target="_blank" style="color: #60a5fa;">Verizon DBIR</a>
	and provides a common language for the security community to share and analyze incident data.
	</p>
	</div>

	<div class="about-card">
	<h3 style="color: #f1f5f9; margin-top: 0;">The 4 A's Framework</h3>
	<table style="width: 100%; border-collapse: collapse; margin-top: 12px;">
	<thead>
	<tr style="border-bottom: 1px solid #334155;">
	<th style="text-align: left; padding: 10px 16px; color: #60a5fa; font-size: 0.85rem; text-transform: uppercase; letter-spacing: 0.05em;">Dimension</th>
	<th style="text-align: left; padding: 10px 16px; color: #60a5fa; font-size: 0.85rem; text-transform: uppercase; letter-spacing: 0.05em;">Categories</th>
	<th style="text-align: left; padding: 10px 16px; color: #60a5fa; font-size: 0.85rem; text-transform: uppercase; letter-spacing: 0.05em;">Question</th>
	</tr>
	</thead>
	<tbody>
	<tr style="border-bottom: 1px solid #1e293b;">
	<td style="padding: 12px 16px; color: #e2e8f0; font-weight: 600;">Actors</td>
	<td style="padding: 12px 16px; color: #94a3b8;">External, Internal, Partner</td>
	<td style="padding: 12px 16px; color: #94a3b8;">Who caused it?</td>
	</tr>
	<tr style="border-bottom: 1px solid #1e293b;">
	<td style="padding: 12px 16px; color: #e2e8f0; font-weight: 600;">Actions</td>
	<td style="padding: 12px 16px; color: #94a3b8;">Malware, Hacking, Social, Misuse, Physical, Error, Environmental</td>
	<td style="padding: 12px 16px; color: #94a3b8;">What did they do?</td>
	</tr>
	<tr style="border-bottom: 1px solid #1e293b;">
	<td style="padding: 12px 16px; color: #e2e8f0; font-weight: 600;">Assets</td>
	<td style="padding: 12px 16px; color: #94a3b8;">Server, Network, User Device, Terminal, Media, People</td>
	<td style="padding: 12px 16px; color: #94a3b8;">What was affected?</td>
	</tr>
	<tr>
	<td style="padding: 12px 16px; color: #e2e8f0; font-weight: 600;">Attributes</td>
	<td style="padding: 12px 16px; color: #94a3b8;">Confidentiality, Integrity, Availability</td>
	<td style="padding: 12px 16px; color: #94a3b8;">How was it affected?</td>
	</tr>
	</tbody>
	</table>
	</div>

	<div class="about-card">
	<h3 style="color: #f1f5f9; margin-top: 0;">About This Project</h3>
	<p style="color: #94a3b8; line-height: 1.7;">
	This classifier uses a <strong style="color: #e2e8f0;">fine-tuned Mistral-7B-Instruct</strong> model,
	trained on <strong style="color: #e2e8f0;">10,000+ real security incidents</strong> from the
	<a href="https://github.com/vz-risk/VCDB" target="_blank" style="color: #60a5fa;">VERIS Community Database (VCDB)</a>
	plus 300+ VERIS Q&A pairs. The model was fine-tuned using QLoRA (4-bit quantization)
	and runs for free on Hugging Face ZeroGPU.
	</p>
	<p style="color: #94a3b8; line-height: 1.7; margin-top: 10px;">
	<strong style="color: #e2e8f0;">Model clarity:</strong> Production inference is
	<strong style="color: #e2e8f0;">Mistral-only</strong> (base:
	<code>mistralai/Mistral-7B-Instruct-v0.3</code> + LoRA adapter
	<code>vibesecurityguy/veris-classifier-v2</code>). This app does not use Qwen.
	</p>
	<div style="display: flex; gap: 12px; margin-top: 16px; flex-wrap: wrap;">
	<a href="https://verisframework.org/" target="_blank" style="display: inline-flex; align-items: center; gap: 6px; background: rgba(59, 130, 246, 0.1); border: 1px solid rgba(59, 130, 246, 0.3); border-radius: 8px; padding: 8px 16px; color: #60a5fa; text-decoration: none; font-size: 0.9rem;">VERIS Framework</a>
	<a href="https://github.com/vz-risk/VCDB" target="_blank" style="display: inline-flex; align-items: center; gap: 6px; background: rgba(139, 92, 246, 0.1); border: 1px solid rgba(139, 92, 246, 0.3); border-radius: 8px; padding: 8px 16px; color: #a78bfa; text-decoration: none; font-size: 0.9rem;">VCDB GitHub</a>
	<a href="https://www.verizon.com/business/resources/reports/dbir/" target="_blank" style="display: inline-flex; align-items: center; gap: 6px; background: rgba(52, 211, 153, 0.1); border: 1px solid rgba(52, 211, 153, 0.3); border-radius: 8px; padding: 8px 16px; color: #34d399; text-decoration: none; font-size: 0.9rem;">Verizon DBIR</a>
	<a href="https://huggingface.co/vibesecurityguy/veris-classifier-v2" target="_blank" style="display: inline-flex; align-items: center; gap: 6px; background: rgba(251, 191, 36, 0.1); border: 1px solid rgba(251, 191, 36, 0.3); border-radius: 8px; padding: 8px 16px; color: #fbbf24; text-decoration: none; font-size: 0.9rem;">Model on HF</a>
	</div>
	</div>

	<div class="about-card">
	<h3 style="color: #f1f5f9; margin-top: 0;">Technical Details</h3>
	<table style="width: 100%; border-collapse: collapse; margin-top: 12px;">
	<tbody>
	<tr style="border-bottom: 1px solid #1e293b;">
	<td style="padding: 10px 16px; color: #94a3b8; width: 40%;">Base Model</td>
	<td style="padding: 10px 16px; color: #e2e8f0;">mistralai/Mistral-7B-Instruct-v0.3</td>
	</tr>
	<tr style="border-bottom: 1px solid #1e293b;">
	<td style="padding: 10px 16px; color: #94a3b8;">Fine-tuning Method</td>
	<td style="padding: 10px 16px; color: #e2e8f0;">QLoRA (4-bit, r=16, alpha=32)</td>
	</tr>
	<tr style="border-bottom: 1px solid #1e293b;">
	<td style="padding: 10px 16px; color: #94a3b8;">Training Data</td>
	<td style="padding: 10px 16px; color: #e2e8f0;">10,019 classification + 311 Q&A pairs</td>
	</tr>
	<tr style="border-bottom: 1px solid #1e293b;">
	<td style="padding: 10px 16px; color: #94a3b8;">Training Epochs</td>
	<td style="padding: 10px 16px; color: #e2e8f0;">3</td>
	</tr>
	<tr style="border-bottom: 1px solid #1e293b;">
	<td style="padding: 10px 16px; color: #94a3b8;">Effective Batch Size</td>
	<td style="padding: 10px 16px; color: #e2e8f0;">8 (2 x 4 gradient accumulation)</td>
	</tr>
	<tr>
	<td style="padding: 10px 16px; color: #94a3b8;">Inference</td>
	<td style="padding: 10px 16px; color: #e2e8f0;">HF ZeroGPU (free A10G burst)</td>
	</tr>
	</tbody>
	</table>
	</div>
	""")

	# --- Footer ---
	gr.HTML("""
	<div class="footer">
	Fine-tuned Mistral-7B-Instruct · VERIS Framework · VCDB · QLoRA
	<br>
	<a href="https://github.com/petershamoon/veris-classifier">Source Code</a> ·
	<a href="https://huggingface.co/vibesecurityguy/veris-classifier-v2">Model</a> ·
	<a href="https://verisframework.org/">VERIS Docs</a> ·
	<a href="https://github.com/vz-risk/VCDB">VCDB</a>
	</div>
	""")

	if IS_SPACES and session_status is not None:
	app.load(
	fn=_session_status_markdown,
	outputs=[session_status],
	queue=False,
	)

	return app


	# Script entry point: the guarded statements run only when this file is
	# executed directly, not when it is imported as a module.
	if __name__ == "__main__":
	# Assemble the UI with build_app(), then start serving it. launch() is
	# called with no arguments, so Gradio's default launch settings apply.
	app = build_app()
	app.launch()