Spaces:

Patricksturg
/

silicon-sampling-dashboard

Running

App Files Files Community

silicon-sampling-dashboard / token_usage.py

Patricksturg

Increase run limit to 15 for Haonan Sun

bb8ee77 verified about 2 months ago

raw

history blame contribute delete

10.8 kB

	"""
	Per-token usage tracking for assignment tokens.

	Tracks how many runs each assignment token has used and enforces
	a maximum. A "run" = one user-triggered generation job (cognitive
	interview, expert review, QAS, or silicon sampling).

	Storage: JSON file, either local or backed by a HuggingFace dataset
	repo for persistence across HF Space restarts.

	Usage in dashboard.py — see integration instructions at bottom of file.
	"""

	import csv
	import hashlib
	import json
	import logging
	import os
	import threading
	from pathlib import Path

	logger = logging.getLogger(__name__)

	# ---------------------------------------------------------------------------
	# Configuration
	# ---------------------------------------------------------------------------

	MAX_RUNS_PER_TOKEN = 8

	# Per-token overrides (token -> max runs)
	_TOKEN_OVERRIDES = {
	"DE9BBFB5": 15, # Haonan Sun
	}


	def get_max_runs(token: str) -> int:
	"""Return the max runs for a token, checking overrides first."""
	return _TOKEN_OVERRIDES.get(token.strip(), MAX_RUNS_PER_TOKEN)

	# Path to the CSV that lists valid tokens (column: "token")
	_TOKEN_CSV_PATH = Path(__file__).parent / "student_tokens.csv"

	# Local JSON file for usage data
	_LOCAL_USAGE_PATH = Path(__file__).parent / "token_usage.json"

	# HuggingFace dataset repo for persistent storage (optional).
	# Set these environment variables on the HF Space to enable:
	# HF_USAGE_REPO = "Patricksturg/cogbot-token-usage" (a private dataset repo)
	# HF_USAGE_TOKEN = a write-access HF token
	_HF_USAGE_REPO = os.environ.get("HF_USAGE_REPO", "")
	_HF_USAGE_TOKEN = os.environ.get("HF_USAGE_TOKEN", "")
	_HF_USAGE_FILENAME = "token_usage.json"

	# Thread lock for safe concurrent access within one process
	_lock = threading.Lock()


	# ---------------------------------------------------------------------------
	# Token masking (for safe logging)
	# ---------------------------------------------------------------------------

	def mask_token(token: str) -> str:
	"""Return a short hash for logging. Never log raw tokens."""
	return hashlib.sha256(token.encode()).hexdigest()[:8]


	# ---------------------------------------------------------------------------
	# Valid token loading
	# ---------------------------------------------------------------------------

	_valid_tokens: set[str] \| None = None


	def _load_valid_tokens() -> set[str]:
	"""Load the set of valid assignment tokens from the CSV."""
	global _valid_tokens
	if _valid_tokens is not None:
	return _valid_tokens

	tokens = set()
	path = _TOKEN_CSV_PATH
	if path.exists():
	with open(path, newline="") as f:
	reader = csv.DictReader(f)
	for row in reader:
	t = row.get("token", "").strip()
	if t:
	tokens.add(t)
	logger.info(f"Loaded {len(tokens)} valid assignment tokens")
	else:
	logger.warning(f"Token CSV not found: {path}")

	_valid_tokens = tokens
	return _valid_tokens


	def is_valid_token(token: str) -> bool:
	"""Check whether a token is in the valid set."""
	return token.strip() in _load_valid_tokens()


	# ---------------------------------------------------------------------------
	# Usage persistence — local JSON
	# ---------------------------------------------------------------------------

	def _load_local() -> dict:
	if _LOCAL_USAGE_PATH.exists():
	try:
	with open(_LOCAL_USAGE_PATH) as f:
	return json.load(f)
	except (json.JSONDecodeError, OSError):
	logger.warning("Corrupt local usage file — starting fresh")
	return {}


	def _save_local(data: dict):
	with open(_LOCAL_USAGE_PATH, "w") as f:
	json.dump(data, f, indent=2)


	# ---------------------------------------------------------------------------
	# Usage persistence — HuggingFace dataset repo
	# ---------------------------------------------------------------------------

	def _hf_enabled() -> bool:
	return bool(_HF_USAGE_REPO and _HF_USAGE_TOKEN)


	def _load_hf() -> dict:
	"""Download token_usage.json from the HF dataset repo."""
	try:
	from huggingface_hub import hf_hub_download
	path = hf_hub_download(
	repo_id=_HF_USAGE_REPO,
	filename=_HF_USAGE_FILENAME,
	repo_type="dataset",
	token=_HF_USAGE_TOKEN,
	)
	with open(path) as f:
	return json.load(f)
	except Exception as e:
	logger.warning(f"Could not load usage from HF repo: {e}")
	return {}


	def _save_hf(data: dict):
	"""Upload token_usage.json to the HF dataset repo."""
	try:
	from huggingface_hub import HfApi
	import tempfile

	api = HfApi(token=_HF_USAGE_TOKEN)
	with tempfile.NamedTemporaryFile(
	mode="w", suffix=".json", delete=False
	) as tmp:
	json.dump(data, tmp, indent=2)
	tmp_path = tmp.name

	api.upload_file(
	path_or_fileobj=tmp_path,
	path_in_repo=_HF_USAGE_FILENAME,
	repo_id=_HF_USAGE_REPO,
	repo_type="dataset",
	commit_message="Update token usage",
	)
	os.unlink(tmp_path)
	except Exception as e:
	logger.error(f"Could not save usage to HF repo: {e}")


	# ---------------------------------------------------------------------------
	# Unified load / save (prefers HF if configured, falls back to local)
	# ---------------------------------------------------------------------------

	def load_token_usage() -> dict:
	"""Load usage data. Returns dict like {"TOKEN": {"runs_used": 3}, ...}."""
	if _hf_enabled():
	return _load_hf()
	return _load_local()


	def save_token_usage(data: dict):
	"""Persist usage data."""
	_save_local(data) # always write local copy
	if _hf_enabled():
	_save_hf(data) # also push to HF if configured


	# ---------------------------------------------------------------------------
	# Public API
	# ---------------------------------------------------------------------------

	def get_runs_used(token: str) -> int:
	"""Return how many runs this token has consumed."""
	with _lock:
	data = load_token_usage()
	return data.get(token, {}).get("runs_used", 0)


	def get_remaining_runs(token: str) -> int:
	"""Return how many runs this token has left."""
	return get_max_runs(token) - get_runs_used(token)


	def can_use_token(token: str) -> tuple[bool, str]:
	"""
	Validate a token and check its quota.

	Returns (ok, message):
	(True, "N runs remaining") — token is valid and has quota
	(False, reason) — token is invalid or exhausted
	"""
	token = token.strip()
	if not is_valid_token(token):
	return False, "Invalid assignment token."

	remaining = get_remaining_runs(token)
	if remaining <= 0:
	return False, (
	"You have reached the maximum number of runs allowed for this "
	"assignment token. If you encountered a technical problem, "
	"contact Patrick Sturgis."
	)
	return True, f"{remaining} runs remaining"


	def increment_token_usage(token: str):
	"""Increment the run count for a token. Persists immediately."""
	with _lock:
	data = load_token_usage()
	entry = data.setdefault(token, {"runs_used": 0})
	entry["runs_used"] += 1
	save_token_usage(data)
	logger.info(
	f"Token {mask_token(token)}: runs_used -> {entry['runs_used']}"
	)


	def rollback_token_usage(token: str):
	"""Decrement the run count (on early failure). Persists immediately."""
	with _lock:
	data = load_token_usage()
	entry = data.get(token)
	if entry and entry.get("runs_used", 0) > 0:
	entry["runs_used"] -= 1
	save_token_usage(data)
	logger.info(
	f"Token {mask_token(token)}: rollback -> {entry['runs_used']}"
	)


	def reset_token(token: str):
	"""Reset a token's usage to zero. For admin use."""
	with _lock:
	data = load_token_usage()
	data[token] = {"runs_used": 0}
	save_token_usage(data)


	def reset_all_tokens():
	"""Reset all token usage to zero. For admin use."""
	with _lock:
	save_token_usage({})


	# ---------------------------------------------------------------------------
	# Integration instructions for dashboard.py (HF version)
	# ---------------------------------------------------------------------------
	#
	# Below is the code to integrate into the HF Space dashboard.py.
	# The exact line numbers will differ — adapt to the live file.
	#
	# ── 1. IMPORT (top of file) ──────────────────────────────────────────────
	#
	# from token_usage import (
	# can_use_token, increment_token_usage, rollback_token_usage,
	# get_remaining_runs, is_valid_token, MAX_RUNS_PER_TOKEN,
	# )
	#
	# ── 2. SESSION STATE (near other session_state inits) ────────────────────
	#
	# if 'active_token' not in st.session_state:
	# st.session_state.active_token = None
	#
	# ── 3. UI: show remaining runs (after token input widget) ────────────────
	#
	# # Assuming assignment_token is the text_input value:
	# if assignment_token:
	# ok, msg = can_use_token(assignment_token)
	# if ok:
	# st.session_state.active_token = assignment_token
	# st.sidebar.info(f"✅ {msg}")
	# else:
	# st.session_state.active_token = None
	# st.sidebar.error(msg)
	#
	# ── 4. GATE: before the run starts (after button click, before sampler) ──
	#
	# # Inside the `if st.button(...)` block, before any API calls:
	# if st.session_state.active_token:
	# ok, msg = can_use_token(st.session_state.active_token)
	# if not ok:
	# st.error(msg)
	# st.session_state.processing = False
	# st.stop()
	# increment_token_usage(st.session_state.active_token)
	#
	# ── 5. ROLLBACK: in the except block for system errors ───────────────────
	#
	# except Exception as e:
	# if st.session_state.get('active_token'):
	# rollback_token_usage(st.session_state.active_token)
	# st.error(f"Error: {e}")
	# st.session_state.processing = False
	#
	# ── 6. DOUBLE-CLICK GUARD ────────────────────────────────────────────────
	#
	# The existing `st.session_state.processing` flag already prevents this:
	# the button is disabled while processing=True. No extra work needed.
	#