Spaces:

build-small-hackathon
/

TurboSkillSlug

Sleeping

App Files Files Community

TurboSkillSlug / model_guard.py

legendarydragontamer

deploy

51a9974 18 days ago

Raw

History Blame Contribute Delete

3.09 kB

	"""
	Compliance guard: makes it impossible to call an over-32B model from the live app path.

	Build Small REQ-01: every model the app depends on must be < 32B total params.
	Frontier models (Opus, GPT-5.x, etc.) are fine in OFFLINE eval/research scripts, but
	must NEVER be on the deployed app's request path.

	Usage in app.py (or any module that runs inside the live Space):
	from model_guard import assert_small_model, APP_RUNTIME
	APP_RUNTIME.enable() # call once at app startup
	assert_small_model(model_name) # call before any model invocation

	In offline research scripts, simply do NOT enable APP_RUNTIME, and frontier calls pass.

	The guard is allow-list based: only known sub-32B models are permitted in app runtime.
	Anything not on the allow-list (or matching a frontier pattern) raises immediately.
	"""

	from __future__ import annotations

	import os
	import re

	# Sub-32B models your APP is allowed to use at runtime. Extend as needed.
	ALLOWED_APP_MODELS = {
	"whisper", "whisper-large", "whisper-809m",
	"qwen2.5-1.5b", "qwen2.5-1.5b-instruct",
	"qwen2.5-7b", "qwen2.5-7b-instruct", # legit fallback + gotcha enrichment (7B < 32B)
	"slugvoice", "slugextract", # your LoRAs on the 1.5B base
	}

	# Patterns that are ALWAYS frontier / over-cap — blocked in app runtime.
	_FRONTIER_PATTERNS = [
	r"opus", r"sonnet", r"gpt-5", r"gpt-4", r"o1", r"o3", r"o4",
	r"claude-3", r"claude-4", r"claude-opus", r"claude-sonnet",
	r"\b\d{2,}b\b", # any "...70b", "...405b" style tag >= 2 digits of B
	r"gemini-1\.5-pro", r"gemini-2", r"deepseek-v", r"llama-3\.1-405b",
	]


	class _AppRuntime:
	"""Flag indicating we're inside the live app (not an offline research script)."""
	def __init__(self):
	self._on = os.environ.get("APP_RUNTIME", "") == "1"

	def enable(self):
	self._on = True

	def disable(self):
	self._on = False

	@property
	def active(self) -> bool:
	return self._on


	APP_RUNTIME = _AppRuntime()


	def _looks_frontier(model_name: str) -> bool:
	m = model_name.lower()
	return any(re.search(p, m) for p in _FRONTIER_PATTERNS)


	def assert_small_model(model_name: str) -> None:
	"""Raise if a frontier/over-cap model is used while the app runtime is active.
	No-op in offline research mode (APP_RUNTIME not enabled)."""
	if not APP_RUNTIME.active:
	return # offline eval/research — frontier calls are allowed here
	name = (model_name or "").strip().lower()
	base = name.split("/")[-1] # strip provider prefix like 'anthropic/'
	allowed = any(base.startswith(a) or a in base for a in ALLOWED_APP_MODELS)
	if _looks_frontier(name) or not allowed:
	raise RuntimeError(
	f"REQ-01 GUARD: refusing to call '{model_name}' from the live app path. "
	f"The deployed app may only use sub-32B models {sorted(ALLOWED_APP_MODELS)}. "
	f"Frontier models are allowed only in offline eval/research scripts "
	f"(do not call APP_RUNTIME.enable() there)."
	)