# gng/gatekeeper.py
# (upload metadata removed — "plexdx: Upload 21 files, f589dab verified" was
#  page-scrape residue, not code; see VCS history for provenance)
"""
gatekeeper.py β€” Groq-powered fact vs. noise edge router.
Design goal: sub-120ms p95 latency to filter social noise before the
expensive RAG + multi-agent pipeline fires.
The gatekeeper uses llama3-8b-8192 on Groq because:
- 800+ tokens/sec throughput β†’ deterministic latency budget
- Structured JSON output schema enforced via Pydantic v2
- Free tier handles high throughput for the gatekeeper role
- Groq's hardware is optimized for small-model, low-latency inference
"""
from __future__ import annotations
import os
import re
from enum import Enum
from functools import lru_cache
import structlog
from groq import AsyncGroq
from pydantic import BaseModel, Field
from tenacity import retry, stop_after_attempt, wait_exponential
log = structlog.get_logger(__name__)
# ── Models ────────────────────────────────────────────────────────────────────
class ClaimLabel(str, Enum):
    """Binary routing label emitted by the gatekeeper classifier."""
    FACT = "fact"    # falsifiable factual claim worth sending downstream for fact-checking
    NOISE = "noise"  # opinion/meme/social filler; filtered out before the expensive pipeline
class GatekeeperResult(BaseModel):
    """Structured classification verdict produced by the gatekeeper.

    Parsed directly from the model's JSON output via ``model_validate_json``,
    so the field names here must match the schema described in
    ``GATEKEEPER_SYSTEM``.
    """
    # Routing decision: FACT proceeds downstream, NOISE is dropped.
    label: ClaimLabel
    reason: str = Field(description="One-sentence explanation for the classification")
    # Bounded by pydantic validators (ge/le), so out-of-range model output fails validation.
    falsifiability_score: float = Field(
        ge=0.0, le=1.0,
        description="0=pure opinion/meme, 1=objectively verifiable claim"
    )
# ── Groq client ───────────────────────────────────────────────────────────────
@lru_cache(maxsize=1)
def get_groq_client() -> AsyncGroq:
    """Return the process-wide AsyncGroq client (memoized via lru_cache).

    When GROQ_API_KEY is unset, logs a warning and constructs the client
    with a placeholder key; callers are expected to fall back to the
    heuristic path before making real API calls.
    """
    key = os.getenv("GROQ_API_KEY", "")
    if key:
        return AsyncGroq(api_key=key)
    log.warning("gatekeeper.no_api_key", msg="GROQ_API_KEY not set, using mock fallback")
    return AsyncGroq(api_key="gsk_placeholder")
# System prompt sent with every classification request. Kept terse so the 8B
# model stays within the latency budget. NOTE: the JSON schema described below
# must stay in sync with GatekeeperResult's fields, and the word "JSON" must
# appear here for Groq's response_format={"type": "json_object"} mode to work.
GATEKEEPER_SYSTEM = """You are a claim falsifiability classifier. Your ONLY job is to decide whether a given piece of text contains a falsifiable factual claim that can be fact-checked.
OUTPUT RULES:
- Respond ONLY with a valid JSON object. No markdown, no preamble.
- Schema: {"label": "fact"|"noise", "reason": "<one sentence>", "falsifiability_score": <0.0-1.0>}
FACT = a specific, falsifiable assertion about the world (statistics, historical events, named person claims, scientific assertions, quotes, causal claims).
NOISE = opinions, memes, questions, sarcasm, social filler, greetings, jokes, abstract feelings.
Examples of FACT:
- "The unemployment rate hit 4.2% in September 2024"
- "Elon Musk acquired Twitter for $44 billion"
- "COVID vaccines contain microchips" (falsifiable even if wrong)
Examples of NOISE:
- "lol this is wild"
- "do you think AI will take our jobs?"
- "i love this song"
- "we need to do better as a society"
"""
@retry(
    stop=stop_after_attempt(2),
    wait=wait_exponential(multiplier=0.1, min=0.05, max=0.5),
    reraise=False,
)
async def classify_claim(text: str) -> GatekeeperResult:
    """
    Classify a text as a falsifiable factual claim ('fact') or noise.
    Falls back gracefully if Groq is unavailable.

    Args:
        text: Arbitrary input text; only the first 800 characters are sent
            to the model.

    Returns:
        GatekeeperResult with label, a one-sentence reason, and a 0.0-1.0
        falsifiability score.

    NOTE(review): the inner try/except catches ALL exceptions and returns the
    heuristic fallback, so the @retry decorator never observes a failure and
    effectively never retries — confirm whether retries were meant to wrap
    the Groq call itself rather than the whole function.
    """
    # Pre-filter: very short text is almost always noise
    if len(text.split()) < 5:
        return GatekeeperResult(
            label=ClaimLabel.NOISE,
            reason="Text too short to contain a verifiable claim.",
            falsifiability_score=0.0,
        )
    # No API key → skip the network entirely and use the CPU-only heuristic.
    api_key = os.getenv("GROQ_API_KEY", "")
    if not api_key:
        return _heuristic_classify(text)
    try:
        client = get_groq_client()
        response = await client.chat.completions.create(
            model="llama3-8b-8192",
            messages=[
                {"role": "system", "content": GATEKEEPER_SYSTEM},
                {"role": "user", "content": f"Classify this text:\n\n{text[:800]}"},
            ],
            temperature=0.0,  # deterministic
            max_tokens=120,  # classification JSON is tiny; cap keeps latency bounded
            response_format={"type": "json_object"},
        )
        # Guard against a null/empty completion; "{}" will fail validation below.
        raw_json = response.choices[0].message.content or "{}"
        # Use model_validate_json — raises ValidationError on bad schema, not try/except
        result = GatekeeperResult.model_validate_json(raw_json)
        log.debug(
            "gatekeeper.classified",
            label=result.label,
            score=result.falsifiability_score,
            text_preview=text[:60],
        )
        return result
    except Exception as exc:
        # Any failure (network, rate limit, malformed JSON, ValidationError)
        # degrades to the heuristic rather than blocking the pipeline.
        log.warning("gatekeeper.groq_error", error=str(exc), fallback="heuristic")
        return _heuristic_classify(text)
def _heuristic_classify(text: str) -> GatekeeperResult:
    """
    CPU-only heuristic fallback when the Groq API is unavailable.

    Bag-of-patterns approach: first check for social-noise shapes, then count
    fact-like signals. Deliberately conservative (leans toward 'fact') so real
    claims are not silently dropped.
    """
    lowered = text.lower()

    # Shapes of social noise: reaction slang, bare punctuation, conversational
    # questions, one-word acknowledgements, and first-person opinion phrases.
    noise_patterns = (
        r"^\s*(lol|lmao|omg|wtf|bruh|smh|imo|tbh|idk|ngl|gg|rip)\b",
        r"^\s*[?!]{1,3}\s*$",
        r"(how are you|what do you think|do you believe|feel like)",
        r"^\s*(yes|no|maybe|sure|ok|okay|yep|nope)\s*[.!?]?\s*$",
        r"(i love|i hate|i feel|i think)\s+(?:this|that|it)",
    )
    if any(re.search(pattern, lowered) for pattern in noise_patterns):
        return GatekeeperResult(
            label=ClaimLabel.NOISE,
            reason="Pattern-matched as social noise by heuristic classifier.",
            falsifiability_score=0.1,
        )

    # Fact-like signals: statistics, attribution language, official statements,
    # crime/death reporting, and embedded links. Each hit adds 0.15 (cap 0.85).
    fact_signals = (
        r"\d+\s*(%|percent|billion|million|thousand)",
        r"\b(according to|reported|confirmed|announced|study|research|data shows)\b",
        r"\b(president|ceo|minister|government|official)\b.{0,50}\b(said|stated|announced)\b",
        r"\b(died|killed|arrested|charged|convicted|sentenced)\b",
        r"https?://",
    )
    matched = [pattern for pattern in fact_signals if re.search(pattern, lowered)]
    score = min(sum(0.15 for _ in matched), 0.85)

    # A single signal (score 0.15) is enough to route the text as a fact.
    if score >= 0.15:
        return GatekeeperResult(
            label=ClaimLabel.FACT,
            reason="Heuristic classification (Groq unavailable).",
            falsifiability_score=score,
        )
    return GatekeeperResult(
        label=ClaimLabel.NOISE,
        reason="Heuristic classification (Groq unavailable).",
        falsifiability_score=0.15,
    )