# Source: ArbitrAgent — agent/bluff_detector.py
# Author: AbeBhatti
# Last commit f8cde5c: "skip HF Hub download on HF Spaces"
"""
bluff_detector.py — bluff signal extraction for ArbitrAgent.
Exposes four rule-based signals (timing, size, formulaic, pattern) and an optional
learned DistilBERT classifier trained on IRC poker bluff labels. Combined score:
bluff_score = 0.6 * learned_bluff_score + 0.4 * rule_score
is_bluff when bluff_score > 0.6.
"""
from __future__ import annotations
import re
from dataclasses import dataclass
import os
from pathlib import Path
from typing import Any, Dict, List, Mapping, Optional, Sequence
from huggingface_hub import hf_hub_download
# Lazy-loaded learned classifier state (populated on first use by
# _get_bluff_classifier; left as None until then).
_bluff_classifier_model = None      # DistilBERT-based classifier module once loaded
_bluff_classifier_tokenizer = None  # matching tokenizer once loaded
_classifier_cache = None            # (model, tokenizer) tuple once resolution ran
def _get_bluff_classifier():
    """Lazy-load the learned bluff classifier (model, tokenizer) pair.

    Checkpoint resolution order:
      1. ``training/checkpoints/bluff_classifier_negotiation.pt`` (negotiation-tuned)
      2. ``training/checkpoints/bluff_classifier.pt`` (poker-trained fallback)
      3. Download of the negotiation checkpoint from the HF Hub — skipped when
         running on HF Spaces (``HF_SPACES=1``).

    Returns
    -------
    tuple
        ``(model, tokenizer)`` on success, ``(None, None)`` when no checkpoint
        is available or loading fails. The result — including failure — is
        cached so repeated calls never re-attempt expensive downloads/loads.
    """
    global _bluff_classifier_model, _bluff_classifier_tokenizer, _classifier_cache
    if _classifier_cache is not None:
        return _classifier_cache
    checkpoints_dir = Path(__file__).resolve().parent.parent / "training" / "checkpoints"
    negotiation_pt = checkpoints_dir / "bluff_classifier_negotiation.pt"
    default_pt = checkpoints_dir / "bluff_classifier.pt"
    # Prefer the negotiation-trained classifier if present, else the poker-trained one.
    if negotiation_pt.exists():
        pt_path = negotiation_pt
    elif default_pt.exists():
        pt_path = default_pt
    else:
        # No local checkpoint. On HF Spaces, skip the Hub download entirely.
        if os.environ.get("HF_SPACES") == "1":
            _classifier_cache = (None, None)
            return _classifier_cache
        try:
            downloaded = hf_hub_download(
                repo_id="Abeee32t/arbitragent-bluff-classifier",
                filename="bluff_classifier_negotiation.pt",
                repo_type="model",
            )
            pt_path = Path(downloaded)
        except Exception:
            # Network/auth failure: cache the miss so we don't hit the Hub on
            # every subsequent call (original code retried the download each time).
            _classifier_cache = (None, None)
            return _classifier_cache
    tok_dir = checkpoints_dir / "bluff_classifier_tokenizer"
    try:
        import torch
        from transformers import AutoTokenizer, AutoModel

        if tok_dir.exists():
            _bluff_classifier_tokenizer = AutoTokenizer.from_pretrained(str(tok_dir))
        else:
            # Fall back to the base DistilBERT tokenizer when the local
            # fine-tuned tokenizer directory is missing.
            _bluff_classifier_tokenizer = AutoTokenizer.from_pretrained("distilbert-base-uncased")

        class _BluffClassifierModule(torch.nn.Module):
            """DistilBERT encoder + linear head over the [CLS] token (2 classes)."""

            def __init__(self):
                super().__init__()
                self.encoder = AutoModel.from_pretrained("distilbert-base-uncased")
                self.head = torch.nn.Linear(self.encoder.config.hidden_size, 2)

            def forward(self, input_ids, attention_mask=None, **kwargs):
                out = self.encoder(input_ids=input_ids, attention_mask=attention_mask)
                return self.head(out.last_hidden_state[:, 0, :])

        _bluff_classifier_model = _BluffClassifierModule()
        _bluff_classifier_model.load_state_dict(
            torch.load(pt_path, map_location="cpu", weights_only=True)
        )
        _bluff_classifier_model.eval()
        _classifier_cache = (_bluff_classifier_model, _bluff_classifier_tokenizer)
        return _classifier_cache
    except Exception:
        # Load failed partway (e.g. load_state_dict raised after the module was
        # constructed). Reset the globals so callers that inspect them never see
        # a half-initialized model, and cache the failure to avoid re-attempting
        # the expensive load on every call.
        _bluff_classifier_model = None
        _bluff_classifier_tokenizer = None
        _classifier_cache = (None, None)
        return _classifier_cache
def _thread_and_message_to_text(thread_history: Sequence[Mapping[str, Any]], seller_message: str) -> str:
"""Convert thread + seller message into text matching poker training format (Position. Preflop. Flop. Turn. River. Pot)."""
parts: List[str] = []
for entry in thread_history:
if "agent" in entry:
parts.append(str(entry["agent"])[:80])
if "seller" in entry:
parts.append(str(entry["seller"])[:80])
# Map to poker-like: Preflop / Flop / Turn / River
preflop = parts[0] if len(parts) > 0 else "-"
flop = parts[1] if len(parts) > 1 else "-"
turn = parts[2] if len(parts) > 2 else "-"
river = seller_message[:200] if seller_message else "-"
return f"Position 1 of 2. Preflop: {preflop}. Flop: {flop}. Turn: {turn}. River: {river}. Pot: 0."
def learned_bluff_score(message: str, thread_history: Sequence[Mapping[str, Any]]) -> float:
    """
    Score the seller message (with thread context) using the learned DistilBERT
    classifier. Returns P(bluff) in [0, 1]; 0.0 when the classifier is not
    loaded or inference fails.
    """
    classifier, tok = _get_bluff_classifier()
    if classifier is None or tok is None:
        return 0.0
    serialized = _thread_and_message_to_text(thread_history, message)
    try:
        import torch

        batch = tok(
            serialized,
            truncation=True,
            max_length=128,
            padding="max_length",
            return_tensors="pt",
        )
        with torch.no_grad():
            logits = classifier(
                input_ids=batch["input_ids"],
                attention_mask=batch["attention_mask"],
            )
            bluff_prob = torch.softmax(logits, dim=1)[0, 1]  # class 1 = bluff
        return float(bluff_prob.item())
    except Exception:
        return 0.0
# Canned finality phrases sellers use when asserting a (possibly fake) price
# floor; matched case-insensitively as substrings by _formulaic_tell. Both
# apostrophized and bare variants are listed because seller text is informal.
FORMULAIC_PHRASES: List[str] = [
    "lowest i can go",
    "lowest i can do",
    "final offer",
    "cant go lower",
    "can't go lower",
    "cant do lower",
    "can't do lower",
    "thats my final offer",
    "that's my final offer",
    "best i can do",
]
@dataclass
class BluffSignals:
    """Per-signal bluff tells (each in [0, 1]) plus the combined verdict."""

    timing_tell: float     # fast responder asserting a floor early in the thread
    size_tell: float       # quoted price lands on a round number
    formulaic_tell: float  # canned "final offer"-style phrasing present
    pattern_tell: float    # finality language after a history of concessions
    bluff_score: float     # weighted blend of rule-based (and learned) scores
    is_bluff: bool         # True when bluff_score > 0.6
# Equal per-signal weights for the rule-based score. analyze_bluff normalizes
# whatever weights it receives, so only the relative magnitudes matter.
DEFAULT_WEIGHTS: Dict[str, float] = {
    "timing_tell": 0.25,
    "size_tell": 0.25,
    "formulaic_tell": 0.25,
    "pattern_tell": 0.25,
}
def analyze_bluff(
    seller_profile: Mapping[str, Any],
    thread_history: Sequence[Mapping[str, Any]],
    seller_message: str,
    turn: Optional[int] = None,
    weights: Optional[Mapping[str, float]] = None,
) -> BluffSignals:
    """
    Analyze a seller response and return bluff signals plus an overall score.

    Parameters
    ----------
    seller_profile:
        The seller profile dict (see simulation.seller_profiles.SELLER_PROFILES).
    thread_history:
        Sequence of {"turn": int, "agent": str} / {"turn": int, "seller": str}
        entries, such as CraigslistSellerSim.thread_history.
    seller_message:
        The seller's latest message to analyze.
    turn:
        Turn index at which this message was sent. If omitted, the maximum
        `turn` value from thread_history is used.
    weights:
        Optional per-signal weights. Keys should be
        {"timing_tell", "size_tell", "formulaic_tell", "pattern_tell"}.
        If omitted, DEFAULT_WEIGHTS are used.
    """
    if turn is None:
        turn = max((entry.get("turn", 0) for entry in thread_history), default=0)
    timing = _timing_tell(seller_profile, turn)
    size = _size_tell(seller_message)
    formulaic = _formulaic_tell(seller_message)
    pattern = _pattern_tell(thread_history, seller_message)
    if weights is None:
        weights = DEFAULT_WEIGHTS
    total_w = float(sum(weights.get(k, 0.0) for k in DEFAULT_WEIGHTS.keys()))
    if total_w <= 0.0:
        # Degenerate weights (all zero or negative): fall back to defaults.
        norm_weights = DEFAULT_WEIGHTS
    else:
        norm_weights = {
            key: float(weights.get(key, 0.0)) / total_w
            for key in DEFAULT_WEIGHTS.keys()
        }
    rule_score = (
        timing * norm_weights["timing_tell"]
        + size * norm_weights["size_tell"]
        + formulaic * norm_weights["formulaic_tell"]
        + pattern * norm_weights["pattern_tell"]
    )
    learned = learned_bluff_score(seller_message, thread_history)
    # BUGFIX: gate the learned blend on the loader's returned model rather than
    # on the _bluff_classifier_model global. A partially failed load can leave
    # that global non-None (the module is constructed before load_state_dict
    # runs and may raise), which would blend in a meaningless learned=0.0 and
    # dilute the rule score by 0.4x.
    model, _tokenizer = _get_bluff_classifier()
    if model is not None:
        bluff_score = 0.6 * learned + 0.4 * rule_score
        # When all four rule tells fire (canonical bluff message), ensure we
        # still flag it even if the learned model says 0 (poker-trained on a
        # different text distribution).
        if rule_score >= 1.0 and bluff_score < 0.6:
            bluff_score = max(bluff_score, 0.65)
    else:
        bluff_score = rule_score
    is_bluff = bluff_score > 0.6
    return BluffSignals(
        timing_tell=timing,
        size_tell=size,
        formulaic_tell=formulaic,
        pattern_tell=pattern,
        bluff_score=bluff_score,
        is_bluff=is_bluff,
    )
def analyze_from_sim(
    sim: Any,
    seller_message: str,
    weights: Optional[Mapping[str, float]] = None,
) -> BluffSignals:
    """
    Analyze a CraigslistSellerSim instance directly.

    Relies on a structural interface only (which avoids circular imports):
    `sim` must expose `profile`, `thread_history`, and `turn` attributes.
    """
    return analyze_bluff(
        seller_profile=sim.profile,
        thread_history=sim.thread_history,
        seller_message=seller_message,
        turn=sim.turn,
        weights=weights,
    )
def _timing_tell(seller_profile: Mapping[str, Any], turn: int) -> float:
"""
Timing tell — did a strong floor assertion arrive suspiciously fast?
Heuristic: sellers with response_speed == "fast" who make this claim in
the first few turns score as a timing tell.
"""
speed = str(seller_profile.get("response_speed", "")).lower()
if speed == "fast" and turn <= 3:
return 1.0
if speed == "fast":
return 0.7
return 0.0
def _size_tell(seller_message: str) -> float:
    """
    Size tell: the quoted price lands cleanly on a round number (anchoring).

    1.0 for multiples of 10, 0.7 for multiples of 5, otherwise (or when no
    price is present) 0.0.
    """
    quoted = _extract_price(seller_message)
    if quoted is None:
        return 0.0
    if quoted % 10 == 0:
        return 1.0
    return 0.7 if quoted % 5 == 0 else 0.0
def _formulaic_tell(seller_message: str) -> float:
    """
    Formulaic tell: canned bluff phrases such as "final offer".

    Case-insensitive substring match against FORMULAIC_PHRASES; 1.0 on any
    hit, else 0.0.
    """
    lowered = seller_message.lower()
    return 1.0 if any(phrase in lowered for phrase in FORMULAIC_PHRASES) else 0.0
def _pattern_tell(
    thread_history: Sequence[Mapping[str, Any]],
    seller_message: str,
) -> float:
    """
    Pattern tell: a behavior shift versus earlier thread history.

    Fires (returns 1.0) only when all of the following hold:
      - at least one prior seller message carries a numeric price,
      - those prior prices show at least one concession (a decrease),
      - the current message uses strong finality language.
    Otherwise returns 0.0.
    """
    seller_msgs = [str(entry["seller"]) for entry in thread_history if "seller" in entry]
    if not seller_msgs:
        return 0.0
    # Drop the current message when it already appears as the last thread entry.
    if seller_msgs[-1].strip() == seller_message.strip():
        prior = seller_msgs[:-1]
    else:
        prior = seller_msgs
    if not prior:
        return 0.0
    prices = [p for p in (_extract_price(msg) for msg in prior) if p is not None]
    if not prices:
        return 0.0
    conceded = any(later < earlier for earlier, later in zip(prices, prices[1:]))
    if not conceded:
        return 0.0
    return 1.0 if _formulaic_tell(seller_message) > 0.0 else 0.0
def _extract_price(text: str) -> Optional[int]:
"""
Extract the last integer that looks like a price from the text.
"""
matches = re.findall(r"\$?\s*(\d+)", text)
if not matches:
return None
try:
return int(matches[-1])
except ValueError:
return None