Spaces:

Aswini-Kumar
/

datacentric-env

Sleeping

App Files Files Community

datacentric-env / server /environment.py

Aswini-Kumar

Upload server/environment.py with huggingface_hub

f22507c verified 23 days ago

raw

history blame contribute delete

22.8 kB

	"""
	server/environment.py — Session-aware environment (v0.5).

	New in v0.5:
	1. Rollback action — undo last apply (real data engineers do this)
	2. Episode reasoning trace — running history of what the agent tried + effects
	3. Feature importance — returned after every apply so agent sees what the model learned
	4. Regression explanation — when accuracy drops, explains the likely cause
	5. Baseline comparison — agent always knows how far ahead of majority-class predictor it is
	"""
	import threading
	import pandas as pd
	import numpy as np

	from server.dataset_registry import DatasetRegistry
	from server.evaluator import Evaluator
	from server.reward import compute, compute_stats
	from server.anti_exploit import AntiExploit, ExploitDetected
	from server.config import cfg
	from server.logger import get_logger, log_event
	from server.specialist_agents import (
	CleanerAgent, AugmenterAgent, BalancerAgent, ValidatorAgent, AnalystAgent
	)

	# Logger used by every log_event call in this module.
	logger = get_logger("environment")

	# Budget units charged for each query action, keyed by action name.
	QUERY_COSTS = dict(
	    query_cleaner=1,
	    query_augmenter=1,
	    query_balancer=1,
	    query_validator=2,
	    query_analyst=2,
	)
	# Action names that are routed to the query handler.
	QUERY_ACTIONS = set(QUERY_COSTS)

	# Single registry instance used by reset() to obtain datasets.
	_registry = DatasetRegistry()


	class DataCentricEnvironment:

	def __init__(self, session_id: str, episode_count: int = 0):
	    """Create an environment bound to one session.

	    Args:
	        session_id: Identifier echoed back in observations, errors and logs.
	        episode_count: Number of episodes already played; reset() increments
	            it and the curriculum reads it to pick a difficulty.
	    """
	    # Guards reset(), step() and state() against concurrent callers.
	    self._lock = threading.Lock()
	    self.session_id = session_id
	    self._episode_count = episode_count
	    # One specialist per role, looked up by short name in the handlers.
	    self.agents = dict(
	        cleaner=CleanerAgent(),
	        augmenter=AugmenterAgent(),
	        balancer=BalancerAgent(),
	        validator=ValidatorAgent(),
	        analyst=AnalystAgent(),
	    )
	    # Must exist before _reset_state(), which calls anti_exploit.reset().
	    self.anti_exploit = AntiExploit()
	    self._reset_state()

	def _reset_state(self):
	    """Return every per-episode attribute to its pre-episode default.

	    The session id, episode counter, agents and lock are left untouched.
	    """
	    # Data and evaluation objects: populated by reset().
	    self.train_df = None
	    self.holdout_df = None
	    self.evaluator = None
	    self.domain_metadata = {}
	    self.initial_row_count = 0

	    # Accuracy bookkeeping.
	    self.target_accuracy = None
	    self.baseline_accuracy = 0.0  # majority-class predictor on holdout
	    self.starting_accuracy = 0.0  # accuracy before ANY agent action
	    self.current_accuracy = 0.0
	    self.accuracy_history = []
	    self.reward_history = []
	    self.last_feature_importance = {}

	    # Episode progress.
	    self.budget = cfg.MAX_BUDGET
	    self.episode_step = 0
	    self.done = False
	    self.difficulty = "easy"

	    # Recommendation tracking.
	    self.pending_recs = {}
	    self.applied_rec_ids = set()
	    self.last_query_result = {}
	    self.anti_exploit.reset()

	    # Rollback: stack of (df_snapshot, accuracy) pairs, capped at 3 by the apply handler.
	    self._state_stack = []
	    # Reasoning trace: one dict appended per recorded step.
	    self._episode_trace = []

	# ── Public API ─────────────────────────────────────────────────────────────

	def reset(self, difficulty: str = None, seed: int = None) -> dict:
	    """Start a new episode and return its first observation.

	    Increments the episode counter, clears per-episode state, fetches a
	    train/holdout split from the module registry and scores the untouched
	    training data so later steps have a starting point to compare against.

	    Args:
	        difficulty: Difficulty requested from the registry. When falsy, the
	            curriculum chooses one from the episode counter.
	        seed: Passed to the registry unchanged.

	    Returns:
	        The observation dict for the freshly reset episode.
	    """
	    with self._lock:
	        self._episode_count += 1
	        self._reset_state()
	        if difficulty:
	            self.difficulty = difficulty
	        else:
	            self.difficulty = self._curriculum_difficulty()

	        train, holdout, metadata = _registry.get(
	            difficulty=self.difficulty, seed=seed
	        )
	        self.train_df = train
	        self.holdout_df = holdout
	        self.domain_metadata = metadata
	        self.initial_row_count = len(self.train_df)
	        self.evaluator = Evaluator(self.holdout_df)

	        # Target is 97% of the published baseline (0.80 when none is given).
	        published = self.domain_metadata.get("published_baseline", 0.80)
	        self.target_accuracy = round(published * 0.97, 4)
	        self.baseline_accuracy = self.evaluator.baseline_accuracy()

	        initial_accuracy = self.evaluator.evaluate(self._clean_df(self.train_df))
	        self.current_accuracy = initial_accuracy
	        self.starting_accuracy = initial_accuracy
	        self.accuracy_history.append(initial_accuracy)

	        dataset_name = self.domain_metadata.get("display_name")
	        rounded_accuracy = round(self.current_accuracy, 4)

	        # Step 0 of the trace records where the episode began.
	        self._episode_trace.append({
	            "step": 0,
	            "type": "reset",
	            "dataset": dataset_name,
	            "accuracy": rounded_accuracy,
	            "baseline_accuracy": self.baseline_accuracy,
	            "target_accuracy": self.target_accuracy,
	        })

	        log_event(
	            logger,
	            "episode_reset",
	            session_id=self.session_id,
	            dataset=dataset_name,
	            difficulty=self.difficulty,
	            initial_accuracy=rounded_accuracy,
	            target_accuracy=self.target_accuracy,
	            baseline_accuracy=self.baseline_accuracy,
	            published_baseline=published,
	            n_train=len(self.train_df),
	            n_holdout=len(self.holdout_df),
	        )
	        return self._observation()

	def step(self, action: dict) -> dict:
	with self._lock:
	if self.done:
	return self._error("Episode done. Call /reset.")
	if self.train_df is None:
	return self._error("Not initialized. Call /reset first.")

	# Rollback action — no anti-exploit check needed
	action_type = action.get("action", "")
	if action_type == "rollback":
	return self._handle_rollback()

	try:
	self.anti_exploit.check(
	action=action,
	budget_remaining=self.budget,
	pending_recs=self.pending_recs,
	applied_rec_ids=self.applied_rec_ids,
	)
	except ExploitDetected as e:
	log_event(logger, "exploit_detected", session_id=self.session_id,
	rule=e.rule, detail=e.detail)
	self.episode_step += 1
	self.budget = max(0, self.budget - 1)
	self.done = self.budget <= 0
	self._episode_trace.append({
	"step": self.episode_step,
	"type": "exploit_blocked",
	"rule": e.rule,
	"detail": e.detail,
	})
	return {
	"observation": self._observation(),
	"reward": 0.001,
	"done": self.done,
	"exploit_detected": True,
	"error": f"[{e.rule}] {e.detail}",
	"info": {"episode_step": self.episode_step, "budget_remaining": self.budget},
	}

	if action_type in QUERY_ACTIONS:
	return self._handle_query(action_type, action)
	elif action_type == "apply":
	return self._handle_apply(action)
	else:
	return self._error(f"Unknown action '{action_type}'. Valid: {list(QUERY_ACTIONS) + ['apply', 'rollback']}")

	def state(self) -> dict:
	with self._lock:
	return self._observation()

	# ── Rollback ───────────────────────────────────────────────────────────────

	def _handle_rollback(self) -> dict:
	"""Undo the last apply operation. Costs 1 budget. Max 3 rollbacks per episode."""
	rollbacks_used = sum(1 for e in self._episode_trace if e["type"] == "rollback")
	if rollbacks_used >= 3:
	return self._error("Maximum 3 rollbacks per episode reached.")
	if not self._state_stack:
	return self._error("Nothing to roll back. No apply operations have been made yet.")

	prev_df, prev_accuracy = self._state_stack.pop()
	self.train_df = prev_df
	self.current_accuracy = prev_accuracy
	self.accuracy_history.append(self.current_accuracy)
	self.budget = max(0, self.budget - 1)
	self.episode_step += 1
	self.done = self.budget <= 0

	self._episode_trace.append({
	"step": self.episode_step,
	"type": "rollback",
	"accuracy_after_rollback": round(self.current_accuracy, 4),
	"note": "Last apply undone. Dataset restored to previous state.",
	})

	log_event(logger, "rollback", session_id=self.session_id,
	accuracy_after=round(self.current_accuracy, 4))

	return {
	"observation": self._observation(),
	"reward": 0.3, # small penalty for indecision, but not zero
	"done": self.done,
	"rollback": True,
	"accuracy_after_rollback": round(self.current_accuracy, 4),
	"info": {
	"episode_step": self.episode_step,
	"budget_remaining": self.budget,
	"rollbacks_remaining": 3 - rollbacks_used - 1,
	"note": "Dataset restored to state before last apply.",
	},
	}

	# ── Query handler ──────────────────────────────────────────────────────────

	def _handle_query(self, action_type: str, action: dict) -> dict:
	    """Ask one specialist agent for recommendations and charge its cost.

	    Each returned recommendation is stored in pending_recs under its "id"
	    so a later apply action can reference it. The training data is not
	    modified, so the reward is computed with identical previous and new
	    accuracy.

	    Args:
	        action_type: A key of QUERY_COSTS naming the agent to query.
	        action: The raw action dict; "target_class" is forwarded to the
	            augmenter.

	    Returns:
	        Result dict with the observation, reward, reward decomposition, the
	        agent's raw result and the ids of the new recommendations.
	    """
	    cost = QUERY_COSTS[action_type]
	    stats_before = compute_stats(self.train_df)
	    visible_df = self._clean_df(self.train_df)
	    metadata = self.domain_metadata

	    # Agents whose query() takes only (df, metadata).
	    plain_agents = {
	        "query_cleaner": "cleaner",
	        "query_balancer": "balancer",
	        "query_validator": "validator",
	        "query_analyst": "analyst",
	    }
	    if action_type == "query_augmenter":
	        result = self.agents["augmenter"].query(
	            visible_df, action.get("target_class"), metadata
	        )
	    elif action_type in plain_agents:
	        result = self.agents[plain_agents[action_type]].query(visible_df, metadata)
	    else:
	        result = {}

	    new_rec_ids = []
	    for recommendation in result.get("recommendations", []):
	        rec_key = recommendation["id"]
	        self.pending_recs[rec_key] = {
	            "rec": recommendation,
	            "agent": result.get("agent", "unknown"),
	        }
	        new_rec_ids.append(rec_key)
	    rec_count = len(new_rec_ids)

	    self.last_query_result = result
	    self.budget = max(0, self.budget - cost)
	    self.episode_step += 1
	    stats_after = compute_stats(self.train_df)

	    reward, decomp = compute(
	        prev_accuracy=self.current_accuracy,
	        new_accuracy=self.current_accuracy,
	        prev_stats=stats_before,
	        new_stats=stats_after,
	        action=action,
	        steps_taken=self.episode_step,
	        max_steps=cfg.MAX_BUDGET,
	        budget_remaining=self.budget,
	        target_accuracy=self.target_accuracy,
	        step_type="query",
	        n_recs_returned=rec_count,
	    )
	    self.reward_history.append(reward)
	    self.done = self.budget <= 0

	    agent_name = action_type.replace("query_", "")
	    self._episode_trace.append({
	        "step": self.episode_step,
	        "type": "query",
	        "agent": agent_name,
	        "n_recs": rec_count,
	        "budget_cost": cost,
	        "budget_remaining": self.budget,
	        "reward": reward,
	        "rec_ids": new_rec_ids,
	    })

	    log_event(
	        logger,
	        "query_step",
	        session_id=self.session_id,
	        action=action_type,
	        n_recs=rec_count,
	        budget=self.budget,
	        reward=reward,
	    )

	    info = {
	        "action_type": "query",
	        "agent_queried": agent_name,
	        "budget_cost": cost,
	        "budget_remaining": self.budget,
	        "n_recommendations": rec_count,
	        "episode_step": self.episode_step,
	        "domain": self.domain_metadata.get("display_name"),
	    }
	    return {
	        "observation": self._observation(),
	        "reward": reward,
	        "reward_decomposition": decomp,
	        "done": self.done,
	        "query_result": result,
	        "new_recommendation_ids": new_rec_ids,
	        "info": info,
	    }

	# ── Apply handler ──────────────────────────────────────────────────────────

	def _handle_apply(self, action: dict) -> dict:
	rec_id = action.get("rec_id", "")
	entry = self.pending_recs[rec_id]
	agent_name = entry["agent"]
	rec = entry["rec"]

	prev_accuracy = self.current_accuracy
	prev_stats = compute_stats(self.train_df)
	prev_rows = len(self.train_df)
	meta = self.domain_metadata

	# Save state for rollback BEFORE applying
	self._state_stack.append((self.train_df.copy(), prev_accuracy))
	if len(self._state_stack) > 3:
	self._state_stack.pop(0) # keep at most last 3

	result_holder: dict = {}
	error_holder: dict = {}

	def _run():
	try:
	clean = self._clean_df(self.train_df)
	df_out, log_msg = self.agents[agent_name].apply(clean, rec, meta)
	result_holder["df"] = df_out
	result_holder["log"] = log_msg
	except Exception as e:
	error_holder["error"] = str(e)

	t = threading.Thread(target=_run, daemon=True)
	t.start()
	t.join(timeout=cfg.STEP_TIMEOUT_SECONDS)

	if t.is_alive():
	self._state_stack.pop() # failed — don't keep stale snapshot
	return self._error("Apply timed out.")
	if "error" in error_holder:
	self._state_stack.pop()
	return self._error(f"Apply error: {error_holder['error']}")

	new_df = result_holder["df"]
	tool_log = result_holder["log"]

	# Data integrity constraint: cannot delete more than 10% of rows
	new_rows = len(new_df)
	deletion_pct = max(0, (prev_rows - new_rows) / max(prev_rows, 1))
	if deletion_pct > 0.10:
	self._state_stack.pop()
	return self._error(
	f"Data integrity violation: would delete {deletion_pct:.1%} of training rows "
	f"(limit: 10%). Use targeted imputation instead of drop_rows."
	)

	self.train_df = new_df
	self.applied_rec_ids.add(rec_id)
	self.episode_step += 1

	# Full evaluation with feature importance + regression explanation
	eval_result = self.evaluator.evaluate_with_details(
	self._clean_df(self.train_df), prev_accuracy
	)
	self.current_accuracy = eval_result["accuracy"]
	self.last_feature_importance = eval_result.get("feature_importance", {})
	regression_explanation = eval_result.get("regression_explanation")

	self.accuracy_history.append(self.current_accuracy)
	new_stats = compute_stats(self.train_df)

	reward, decomp = compute(
	prev_accuracy=prev_accuracy,
	new_accuracy=self.current_accuracy,
	prev_stats=prev_stats,
	new_stats=new_stats,
	action=action,
	steps_taken=self.episode_step,
	max_steps=cfg.MAX_BUDGET,
	budget_remaining=self.budget,
	target_accuracy=self.target_accuracy,
	step_type="apply",
	)
	self.reward_history.append(reward)
	self.done = (self.current_accuracy >= self.target_accuracy) or (self.budget <= 0)

	acc_delta = round(self.current_accuracy - prev_accuracy, 4)
	self._episode_trace.append({
	"step": self.episode_step,
	"type": "apply",
	"agent": agent_name,
	"rec_type": rec.get("type", "?"),
	"rec_id": rec_id,
	"accuracy_before": round(prev_accuracy, 4),
	"accuracy_after": round(self.current_accuracy, 4),
	"accuracy_delta": acc_delta,
	"effect": "improved" if acc_delta > 0.001 else ("hurt" if acc_delta < -0.001 else "neutral"),
	"reward": reward,
	"rows_before": prev_rows,
	"rows_after": new_rows,
	})

	log_event(logger, "apply_step", session_id=self.session_id,
	rec_id=rec_id, agent=agent_name,
	prev_acc=round(prev_accuracy, 4),
	new_acc=round(self.current_accuracy, 4),
	target=self.target_accuracy,
	reward=reward,
	success=self.current_accuracy >= self.target_accuracy)

	response = {
	"observation": self._observation(),
	"reward": reward,
	"reward_decomposition": decomp,
	"done": self.done,
	"tool_log": tool_log,
	"feature_importance": self.last_feature_importance,
	"info": {
	"action_type": "apply",
	"rec_id": rec_id,
	"agent": agent_name,
	"rec_type": rec.get("type", "?"),
	"prev_accuracy": round(prev_accuracy, 4),
	"new_accuracy": round(self.current_accuracy, 4),
	"accuracy_delta": acc_delta,
	"target_accuracy": self.target_accuracy,
	"published_baseline": self.domain_metadata.get("published_baseline"),
	"improvement_over_start": round(self.current_accuracy - self.starting_accuracy, 4),
	"improvement_over_majority_baseline": round(self.current_accuracy - self.baseline_accuracy, 4),
	"budget_remaining": self.budget,
	"episode_step": self.episode_step,
	"success": self.current_accuracy >= self.target_accuracy,
	"rollbacks_available": max(0, 3 - sum(1 for e in self._episode_trace if e["type"] == "rollback")),
	"data_integrity": {
	"rows_before": prev_rows,
	"rows_after": new_rows,
	"deletion_pct": round(deletion_pct, 4),
	},
	},
	}

	# Only include regression explanation when accuracy dropped
	if regression_explanation:
	response["regression_explanation"] = regression_explanation

	return response

	# ── Helpers ────────────────────────────────────────────────────────────────

	def _clean_df(self, df):
	drop_cols = [c for c in df.columns if c.startswith("_")]
	return df.drop(columns=drop_cols) if drop_cols else df

	def _observation(self) -> dict:
	stats = compute_stats(self.train_df) if self.train_df is not None else {}
	pending_summary = {
	rid: {
	"agent": entry["agent"],
	"type": entry["rec"].get("type", "?"),
	"priority": entry["rec"].get("priority", "?"),
	"reason": entry["rec"].get("reason", ""),
	"domain_informed": entry["rec"].get("domain_informed", False),
	}
	for rid, entry in self.pending_recs.items()
	if rid not in self.applied_rec_ids
	}
	meta = self.domain_metadata

	# Compact trace — last 5 steps for context without overwhelming the prompt
	recent_trace = self._episode_trace[-5:] if self._episode_trace else []

	return {
	"session_id": self.session_id,

	# What the agent is working on
	"dataset": {
	"name": meta.get("display_name", "Unknown"),
	"domain": meta.get("domain", "generic"),
	"description": meta.get("description", ""),
	"known_issues": meta.get("known_issues", []),
	"published_baseline": meta.get("published_baseline"),
	},

	# Current state
	"current_accuracy": round(self.current_accuracy, 4),
	"target_accuracy": self.target_accuracy,
	"accuracy_gap": round(max(0, self.target_accuracy - self.current_accuracy), 4),
	"budget_remaining": self.budget,
	"difficulty": self.difficulty,

	# Comparisons — what does this number actually mean?
	"benchmarks": {
	"majority_class_baseline": self.baseline_accuracy,
	"starting_accuracy": round(self.starting_accuracy, 4),
	"improvement_over_start": round(self.current_accuracy - self.starting_accuracy, 4),
	"improvement_over_baseline": round(self.current_accuracy - self.baseline_accuracy, 4),
	"published_baseline": meta.get("published_baseline"),
	},

	"dataset_stats": {
	"n_train_rows": len(self.train_df) if self.train_df is not None else 0,
	"n_holdout_rows": len(self.holdout_df) if self.holdout_df is not None else 0,
	"n_cols": len(self.train_df.columns) if self.train_df is not None else 0,
	"missing_pct": round(stats.get("missing_pct", 0), 4),
	"balance_ratio": round(stats.get("balance_ratio", 0), 4),
	},

	# Feature importance from last evaluation
	"feature_importance": self.last_feature_importance,

	# Episodic memory — what has the agent tried so far?
	"episode_trace": recent_trace,

	"pending_recommendations": pending_summary,
	"last_query_result": self.last_query_result,
	"available_actions": (
	"query_cleaner \| query_augmenter \| query_balancer \| "
	"query_validator (cost 2) \| query_analyst (cost 2) \| "
	"apply {rec_id} \| rollback (undo last apply, max 3/episode)"
	),
	}

	def _error(self, msg: str) -> dict:
	return {"error": msg, "session_id": self.session_id}

	def _curriculum_difficulty(self) -> str:
	    """Pick a difficulty from the number of episodes played so far.

	    Returns:
	        "easy" below cfg.CURRICULUM_MEDIUM_AFTER episodes, "medium" below
	        cfg.CURRICULUM_HARD_AFTER, and "hard" from then on.
	    """
	    played = self._episode_count
	    if played >= cfg.CURRICULUM_MEDIUM_AFTER:
	        return "hard" if played >= cfg.CURRICULUM_HARD_AFTER else "medium"
	    return "easy"

	def episode_summary(self) -> dict:
	return {
	"session_id": self.session_id,
	"episode_count": self._episode_count,
	"accuracy_history": [round(a, 4) for a in self.accuracy_history],
	"reward_history": [round(r, 4) for r in self.reward_history],
	"mean_reward": round(sum(self.reward_history) / max(len(self.reward_history), 1), 4),
	"full_trace": self._episode_trace,
	}