Spaces:

nice-bill
/

agent-arena

Running

App Files Files Community

agent-arena / core /simulation.py

nice-bill

deploy from github

17390ee verified about 2 months ago

raw

history blame contribute delete

26 kB

	"""Main simulation engine for DeFi agent market."""

	import json
	import random
	from typing import List, Dict, Optional
	from dataclasses import dataclass

	from core.agent import Agent
	from core.defi_mechanics import Pool
	from core.summarizer import Summarizer
	from api.supabase_client import (
	SupabaseClient, RunData, AgentStateData, PoolStateData, ActionData, MetricsData
	)
	from config import NUM_AGENTS, TURNS_PER_RUN


	@dataclass
	class Simulation:
	"""Orchestrates the DeFi agent simulation.

	Every annotated name below is a dataclass field, so each one (including
	the upper-case tuning knobs) can be overridden per instance through the
	generated constructor.
	"""

	# Number of agents created for each run.
	num_agents: int = NUM_AGENTS
	# Number of turns played in each run.
	turns_per_run: int = TURNS_PER_RUN
	# Persistence client; __post_init__ tries to build one when this is None.
	supabase: Optional[SupabaseClient] = None

	# Alliance bonus config
	ALLIANCE_BONUS: float = 4.0 # Bonus for successful alliance

	# Action bonuses
	LIQUIDITY_BONUS: float = 8.0 # Bonus for providing liquidity
	SWAP_BONUS: float = 3.0 # Bonus for active trading
	COORDINATED_TRADE_BONUS: float = 5.0 # Bonus for trading with allies
	PROFIT_BONUS: float = 15.0 # Bonus for ending turn with positive profit

	# Market maker config
	ENABLE_MARKET_MAKER: bool = True
	MARKET_MAKER_INTERVAL: int = 3 # Market maker acts every N turns
	MARKET_MAKER_VOLATILITY: float = 0.15 # 15% price shock

	# Chaos agent config
	ENABLE_CHAOS_AGENT: bool = True
	CHAOS_AGENT_CHANCE: float = 0.35 # 35% chance each turn
	CHAOS_AGENT_MIN_VOLATILITY: float = 0.25 # Min 25% of reserves
	CHAOS_AGENT_MAX_VOLATILITY: float = 0.50 # Max 50% of reserves

	def __post_init__(self):
	self.agents: List[Agent] = []
	self.pool: Optional[Pool] = None
	self.current_run_id: Optional[int] = None
	self.current_run_number: int = 0
	self.market_maker_trades: List[Dict] = []
	self.price_shocks: List[Dict] = []

	if self.supabase is None:
	try:
	self.supabase = SupabaseClient()
	except ValueError:
	print("Warning: Supabase not configured. Running without persistence.")
	self.supabase = None

	def initialize_run(self, run_number: Optional[int] = None):
	    """Initialize a new run with fresh agents, a fresh pool and clean event logs.

	    Args:
	        run_number: Explicit run number. When None, the next number is
	            requested from the persistence client if one is configured,
	            otherwise it is the current run number plus one.
	    """
	    if run_number is None:
	        if self.supabase:
	            run_number = self.supabase.get_next_run_number()
	        else:
	            run_number = self.current_run_number + 1

	    self.current_run_number = run_number
	    self.agents = [Agent(f"Agent_{i}") for i in range(self.num_agents)]
	    self.pool = Pool()

	    # The event logs are indexed by turn number, which restarts at 0 every
	    # run; clear them so records from a previous run cannot be mistaken for
	    # events of this one (and so they do not grow without bound).
	    self.market_maker_trades = []
	    self.price_shocks = []

	    print(f"Initialized run {run_number} with {self.num_agents} agents")

	    if self.supabase:
	        self.current_run_id = self.supabase.create_run(run_number)
	        print(f"Created run in database: ID {self.current_run_id}")

	def run(self, run_number: Optional[int] = None) -> Dict:
	    """Execute a complete simulation run and return its metrics.

	    The run is initialized, every turn is played, and the final metrics are
	    computed. When a persistence client is configured the run is marked
	    complete, its metrics are saved and a summary is generated (summary
	    failures are reported but do not abort the run).

	    While turns are being played, SIGTERM/SIGINT handlers save the progress
	    as an "incomplete" run and exit; the previous handlers are restored once
	    the turn loop ends so a later signal cannot relabel a finished run.

	    Args:
	        run_number: Explicit run number; when None, ``initialize_run``
	            chooses one.

	    Returns:
	        The metrics dict produced by ``_calculate_metrics``.
	    """
	    # Debug: Check supabase status
	    has_supabase = self.supabase is not None
	    print(f"[DEBUG] run() called, supabase={'yes' if has_supabase else 'NO'}")

	    self.initialize_run(run_number)

	    print(f"\n=== Starting run {self.current_run_number} with {self.turns_per_run} turns ===")
	    if self.ENABLE_MARKET_MAKER:
	        print(f"Market Maker: ENABLED (creates volatility every {self.MARKET_MAKER_INTERVAL} turns)")
	    if self.ENABLE_CHAOS_AGENT:
	        print("Chaos Agent: ENABLED (random unpredictable moves)")
	    print(f"Alliance Bonus: {self.ALLIANCE_BONUS} tokens for successful cooperation")
	    print("Boredom Penalty: Agents lose tokens after 2+ consecutive do_nothing actions")
	    print()

	    # Shared with the shutdown handler so it knows which turn was in flight.
	    progress = {"turn": 0}
	    previous_handlers = self._install_shutdown_handlers(progress)
	    try:
	        for turn in range(self.turns_per_run):
	            progress["turn"] = turn
	            self._play_turn(turn)
	    finally:
	        self._restore_signal_handlers(previous_handlers)

	    # Calculate and save metrics
	    metrics = self._calculate_metrics()

	    if self.supabase:
	        self.supabase.complete_run(self.current_run_id)
	        self.supabase.save_metrics(self._build_metrics_data(metrics))

	        # Generate and save run summary (best effort)
	        try:
	            print(f"Generating summary for run {self.current_run_number}...")
	            summarizer = Summarizer(supabase=self.supabase)
	            summarizer.summarize_and_save(self.current_run_id)
	            print(f"Generated summary for run {self.current_run_number}")
	        except Exception as e:
	            print(f"Warning: Failed to generate summary - {e}")
	            import traceback
	            traceback.print_exc()

	    # Update agent learning
	    for agent in self.agents:
	        agent.update_learning(self.current_run_number, metrics)

	    print(f"\n--- Run {self.current_run_number} Complete ---")
	    print(f"Final metrics: {json.dumps(metrics, indent=2)}")

	    # NOTE(review): initialize_run() also adds 1 when no run number is
	    # given and no persistence client exists, so consecutive local runs are
	    # numbered 1, 3, 5, ... Kept as-is because callers may read this
	    # attribute after run(); confirm and drop one of the increments.
	    self.current_run_number += 1
	    return metrics

	def _play_turn(self, turn: int):
	    """Play one turn: market events, agent actions, penalties, bonuses, snapshot."""
	    print(f"\n--- Turn {turn + 1}/{self.turns_per_run} ---")

	    # Market maker creates volatility every N turns
	    if self.ENABLE_MARKET_MAKER and (turn + 1) % self.MARKET_MAKER_INTERVAL == 0:
	        self._market_maker_action(turn)

	    # Random price shock event (25% chance each turn)
	    if random.random() < 0.25:
	        self._trigger_price_shock(turn)

	    # Chaos agent creates unpredictable moves (configured chance per turn)
	    if self.ENABLE_CHAOS_AGENT and random.random() < self.CHAOS_AGENT_CHANCE:
	        self._chaos_agent_action(turn)

	    # Each agent makes a decision
	    for agent in self.agents:
	        decision, thinking = self._agent_decide(agent, turn)
	        # Normalize a missing decision so the lookups below cannot crash.
	        decision = decision or {}
	        action_type = decision.get('action', 'unknown')

	        # Save profit before action for profit detection
	        agent._last_profit = agent.calculate_profit()

	        # An empty decision executes nothing and is reported as a failure.
	        success = False
	        if decision:
	            success = agent.execute_action(decision, self.pool)

	            # Grant bonuses for successful actions
	            if success and action_type != 'do_nothing':
	                self._grant_action_bonus(agent, action_type, decision, turn)

	        # Track inaction
	        if action_type == 'do_nothing':
	            agent.increment_inaction_counter()
	        else:
	            agent.reset_inaction_counter()

	        print(f" {agent.name}: {action_type} {'OK' if success else 'FAIL'}")

	        # Save action to database
	        if self.supabase:
	            self._save_action(agent, turn, decision, thinking)

	    # Apply boredom penalties AFTER all agents act
	    for agent in self.agents:
	        penalty = agent.apply_boredom_penalty()
	        if penalty > 0:
	            print(f" {agent.name}: Boredom penalty -{penalty:.1f} tokens")

	    # Check for successful alliances and grant bonuses
	    self._process_alliances(turn)

	    # Grant profit bonus for agents with positive profit
	    self._grant_profit_bonuses(turn)

	    # Save state snapshots
	    if self.supabase:
	        self._save_states(turn)

	def _build_metrics_data(self, metrics: Dict):
	    """Wrap a metrics dict in a MetricsData record for the current run."""
	    return MetricsData(
	        run_id=self.current_run_id,
	        gini_coefficient=metrics.get("gini_coefficient", 0),
	        cooperation_rate=metrics.get("cooperation_rate", 0),
	        betrayal_count=metrics.get("betrayal_count", 0),
	        avg_agent_profit=metrics.get("avg_agent_profit", 0),
	        pool_stability=metrics.get("pool_stability", 0)
	    )

	def _save_incomplete_run(self, turn: int):
	    """Persist the run as "incomplete" with current metrics and a state snapshot."""
	    if not (self.supabase and self.current_run_id):
	        return
	    try:
	        metrics = self._calculate_metrics()
	        self.supabase.update_run_status(self.current_run_id, "incomplete")
	        self.supabase.save_metrics(self._build_metrics_data(metrics))
	        # Snapshot under the turn that was in flight when the signal arrived.
	        self._save_states(turn)
	    except Exception as e:
	        # Best effort: the process is shutting down anyway.
	        print(f"[SHUTDOWN] Failed to save progress: {e}")

	def _install_shutdown_handlers(self, progress: Dict) -> Dict:
	    """Install SIGTERM/SIGINT handlers; return the handlers they replaced."""
	    previous = {}
	    # Register graceful shutdown handler (may not work in all environments)
	    try:
	        import signal

	        def shutdown_handler(signum, frame):
	            print(f"\n[SHUTDOWN] Received signal, saving progress...")
	            self._save_incomplete_run(progress["turn"])
	            print(f"[SHUTDOWN] Run marked as incomplete")
	            raise SystemExit(0)

	        for sig in (signal.SIGTERM, signal.SIGINT):
	            previous[sig] = signal.signal(sig, shutdown_handler)
	    except (ValueError, AttributeError) as e:
	        print(f"[WARN] Signal handlers not available: {e}")
	    return previous

	@staticmethod
	def _restore_signal_handlers(previous: Dict):
	    """Reinstall the signal handlers saved by ``_install_shutdown_handlers``."""
	    if not previous:
	        return
	    import signal
	    for sig, handler in previous.items():
	        # None means the old handler was not installed from Python and
	        # cannot be passed back to signal.signal().
	        if handler is None:
	            continue
	        try:
	            signal.signal(sig, handler)
	        except (ValueError, TypeError) as e:
	            print(f"[WARN] Could not restore signal handler: {e}")

	def _agent_decide(self, agent: Agent, turn: int) -> tuple:
	"""Get decision from agent."""
	observation = {
	"turn": turn,
	"event": "trading"
	}
	pool_state = self.pool.get_state()

	try:
	decision, thinking = agent.decide(
	observation,
	pool_state,
	self.agents,
	turn
	)
	return decision, thinking
	except Exception as e:
	print(f" {agent.name}: Decision error - {e}")
	return {"action": "do_nothing", "reasoning": f"Error: {e}"}, ""

	def _save_action(self, agent: Agent, turn: int, decision: Dict, thinking: str):
	"""Save agent action to database."""
	if not self.supabase:
	return
	self.supabase.save_action(ActionData(
	run_id=self.current_run_id,
	turn=turn,
	agent_name=agent.name,
	action_type=decision.get("action", "unknown"),
	payload=decision.get("payload", {}),
	reasoning_trace=decision.get("reasoning", ""),
	thinking_trace=thinking
	))

	def _save_states(self, turn: int):
	"""Save agent and pool states to database."""
	if not self.supabase:
	return

	# Save agent states
	for agent in self.agents:
	self.supabase.save_agent_state(AgentStateData(
	run_id=self.current_run_id,
	turn=turn,
	agent_name=agent.name,
	token_a_balance=agent.token_a,
	token_b_balance=agent.token_b,
	profit=agent.calculate_profit(),
	strategy=agent.infer_strategy()
	))

	# Save pool state
	self.supabase.save_pool_state(PoolStateData(
	run_id=self.current_run_id,
	turn=turn,
	reserve_a=self.pool.reserve_a,
	reserve_b=self.pool.reserve_b,
	price_ab=self.pool.price_ab,
	total_liquidity=self.pool.total_liquidity
	))

	def _calculate_metrics(self) -> Dict:
	"""Calculate run metrics."""
	if not self.agents:
	return {}

	profits = [a.calculate_profit() for a in self.agents]
	gini = self._gini_coefficient(profits)

	return {
	"gini_coefficient": gini,
	"avg_agent_profit": sum(profits) / len(profits),
	"cooperation_rate": self._calculate_cooperation(),
	"betrayal_count": self._count_betrayals(),
	"pool_stability": self.pool.reserve_a * self.pool.reserve_b
	}

	@staticmethod
	def _gini_coefficient(values: List[float]) -> float:
	"""Calculate Gini coefficient for wealth distribution."""
	if not values or sum(values) == 0:
	return 0

	sorted_vals = sorted(values)
	n = len(sorted_vals)
	cumsum = 0
	for i, val in enumerate(sorted_vals):
	cumsum += (i + 1) * val

	gini = (2 * cumsum) / (n * sum(sorted_vals)) - (n + 1) / n
	return max(0, min(1, gini)) # Clamp to 0-1

	def _calculate_cooperation(self) -> float:
	"""Calculate cooperation rate (alliances / agents)."""
	total_alliances = sum(len(a.alliances) for a in self.agents)
	return total_alliances / max(len(self.agents), 1)

	def _count_betrayals(self) -> int:
	"""Count betrayal events (placeholder for future implementation)."""
	return 0

	def _market_maker_action(self, turn: int):
	"""
	Market maker creates artificial volatility by making large trades.
	This encourages other agents to react and trade.
	"""
	# Decide direction: buy A (pushes price up) or buy B (pushes price down)
	direction = random.choice(['buy_a', 'buy_b'])
	amount = self.pool.reserve_a * self.MARKET_MAKER_VOLATILITY

	if direction == 'buy_a':
	# Buy A with B - increases A reserve, decreases B reserve
	output, fee = self.pool.swap('b', amount, 'MarketMaker')
	print(f" [MarketMaker]: Swapped {amount:.0f} B for {output:.1f} A (volatility trade)")
	else:
	# Buy B with A - increases B reserve, decreases A reserve
	output, fee = self.pool.swap('a', amount, 'MarketMaker')
	print(f" [MarketMaker]: Swapped {amount:.0f} A for {output:.1f} B (volatility trade)")

	self.market_maker_trades.append({
	'turn': turn,
	'direction': direction,
	'amount': amount,
	'pool_state': self.pool.get_state()
	})

	def _trigger_price_shock(self, turn: int):
	"""
	Random external event that causes a price shock.
	Creates trading opportunities for attentive agents.
	"""
	# Random shock between -20% and +20%
	shock_pct = random.uniform(-0.20, 0.20)
	direction = "UP" if shock_pct > 0 else "DOWN"

	# Apply shock by doing a large swap
	amount = self.pool.reserve_a * abs(shock_pct)

	if shock_pct > 0:
	# Price goes up: buy A with B
	output, _ = self.pool.swap('b', amount, 'PriceShock')
	print(f" [EVENT] Price shock {direction} (+{shock_pct*100:.1f}%): Swap {amount:.0f} B -> {output:.1f} A")
	else:
	# Price goes down: buy B with A
	output, _ = self.pool.swap('a', amount, 'PriceShock')
	print(f" [EVENT] Price shock {direction} ({shock_pct*100:.1f}%): Swap {amount:.0f} A -> {output:.1f} B")

	def _chaos_agent_action(self, turn: int):
	    """
	    Chaos agent creates unpredictable market moves.
	    Forces other agents to react to unexpected volatility.

	    One of three actions is picked at random (swap, liquidity provision,
	    massive swap) with a volatility drawn between
	    ``CHAOS_AGENT_MIN_VOLATILITY`` and ``CHAOS_AGENT_MAX_VOLATILITY``.
	    The action is applied to the pool, persisted and printed.

	    Args:
	        turn: Index of the turn in which the chaos action happens.
	    """
	    # Random action type: swap, liquidity, or massive_swap
	    action_type = random.choice(['chaos_swap', 'chaos_liquidity', 'chaos_massive_swap'])

	    # Random volatility within the configured bounds
	    volatility = random.uniform(self.CHAOS_AGENT_MIN_VOLATILITY, self.CHAOS_AGENT_MAX_VOLATILITY)

	    chaos_agent = Agent("ChaosAgent")

	    if action_type == 'chaos_liquidity':
	        # Random liquidity provision, proportional to both reserves
	        amount_a = self.pool.reserve_a * volatility
	        amount_b = self.pool.reserve_b * volatility
	        self.pool.provide_liquidity(amount_a, amount_b, 'ChaosAgent')
	        decision = {"action": "chaos_liquidity", "amount_a": amount_a, "amount_b": amount_b}
	        self._save_chaos_action(chaos_agent, turn, decision, "Chaos agent adds unpredictable liquidity")
	        print(f" [ChaosAgent]: Random liquidity +{amount_a:.0f}A/+{amount_b:.0f}B")
	        return

	    # Both swap variants: random direction, sized from the reserve of the
	    # token being sold so the impact is the same fraction either way.
	    direction = random.choice(['a', 'b'])
	    sold_reserve = self.pool.reserve_a if direction == 'a' else self.pool.reserve_b
	    amount = sold_reserve * volatility

	    if action_type == 'chaos_swap':
	        output, _ = self.pool.swap(direction, amount, 'ChaosAgent')
	        decision = {"action": "chaos_swap", "direction": direction, "amount": amount}
	        self._save_chaos_action(chaos_agent, turn, decision, "Chaos agent creates random market volatility")
	        print(f" [ChaosAgent]: Random swap {amount:.0f} -> {output:.1f}")
	    else: # chaos_massive_swap
	        # Huge random trade that moves price significantly
	        amount = amount * 1.5 # Even bigger
	        output, _ = self.pool.swap(direction, amount, 'ChaosAgent')
	        decision = {"action": "chaos_massive_swap", "direction": direction, "amount": amount}
	        self._save_chaos_action(chaos_agent, turn, decision, "Chaos agent executes MASSIVE trade causing extreme volatility!")
	        print(f" [ChaosAgent]: MASSIVE swap {amount:.0f} -> {output:.1f}!")

	def _save_chaos_action(self, agent: Agent, turn: int, decision: Dict, thinking: str):
	"""Save chaos agent action to database."""
	if not self.supabase:
	return
	self.supabase.save_action(ActionData(
	run_id=self.current_run_id,
	turn=turn,
	agent_name=agent.name,
	action_type=decision.get("action", "unknown"),
	payload=decision,
	reasoning_trace=thinking,
	thinking_trace=""
	))

	def _process_alliances(self, turn: int):
	"""
	Process alliances and grant bonuses for mutual proposals.
	When two agents propose alliance to each other (even across turns), both get a bonus.
	"""
	# Find mutual alliance pairs
	for i, agent_a in enumerate(self.agents):
	for agent_b in self.agents[i + 1:]:
	# Check if both have proposed alliance to each other (any status, not just 'proposed')
	a_proposed_to_b = agent_b.name in agent_a.alliances
	b_proposed_to_a = agent_a.name in agent_b.alliances

	if a_proposed_to_b and b_proposed_to_a:
	# Get current statuses
	status_a = agent_a.alliances.get(agent_b.name, "")
	status_b = agent_b.alliances.get(agent_a.name, "")

	# Skip if already successful
	if status_a == 'success' and status_b == 'success':
	continue

	# Successful alliance! Grant bonus to both (with fatigue)
	fatigue_a = agent_a.get_alliance_fatigue(agent_b.name)
	fatigue_b = agent_b.get_alliance_fatigue(agent_a.name)

	# Apply fatigue - minimum 0 bonus for repeated proposals
	bonus_a = self.ALLIANCE_BONUS * fatigue_a
	bonus_b = self.ALLIANCE_BONUS * fatigue_b

	# Give bonus in Token A
	agent_a.token_a += bonus_a
	agent_b.token_a += bonus_b

	# Record proposals for fatigue tracking
	agent_a.record_alliance_proposal(agent_b.name)
	agent_b.record_alliance_proposal(agent_a.name)

	# Mark alliances as successful
	agent_a.alliances[agent_b.name] = 'success'
	agent_b.alliances[agent_a.name] = 'success'

	# Print appropriate message
	if fatigue_a == 0 or fatigue_b == 0:
	print(f" [ALLIANCE] {agent_a.name} + {agent_b.name}: No bonus (alliance fatigue)")
	elif fatigue_a == 0.5 or fatigue_b == 0.5:
	print(f" [ALLIANCE] {agent_a.name} + {agent_b.name}: HALF bonus +{bonus_a:.1f}/+{bonus_b:.1f} tokens")
	else:
	print(f" [ALLIANCE] {agent_a.name} + {agent_b.name}: BONUS +{bonus_a:.1f}/+{bonus_b:.1f} tokens")

	if self.supabase:
	self.supabase.save_action(ActionData(
	run_id=self.current_run_id,
	turn=turn,
	agent_name=f"{agent_a.name}+{agent_b.name}",
	action_type="alliance_success",
	payload={"bonus_a": bonus_a, "bonus_b": bonus_b, "partners": [agent_a.name, agent_b.name]},
	reasoning_trace=f"Alliance formed between {agent_a.name} and {agent_b.name}",
	thinking_trace=""
	))

	def _get_leader_bonus(self, agent: Agent) -> float:
	"""
	Check if agent is the top performer and deserves leader multiplier.
	Returns 2.0 if leader, 1.0 otherwise.
	"""
	if not self.agents or len(self.agents) < 2:
	return 1.0

	agent_profit = agent.calculate_profit()
	for other in self.agents:
	if other.name != agent.name:
	if other.calculate_profit() > agent_profit:
	return 1.0 # Not the leader

	return 2.0 # Leader gets 2x bonus

	def _grant_action_bonus(self, agent: Agent, action_type: str, decision: Dict, turn: int):
	"""
	Grant bonuses for active trading behaviors.

	- Provide liquidity: +8 tokens
	- Swap: +3 tokens (active trading)
	- Coordinated trade with ally: +5 bonus tokens
	- Profitable trade: +5 bonus tokens
	- Escape velocity: Top agent gets 2x multiplier on all bonuses
	"""
	bonus = 0
	bonus_reason = ""

	# Check if agent is the top performer (escape velocity)
	leader_bonus = self._get_leader_bonus(agent)
	if leader_bonus > 1.0:
	bonus_reason += f"(LEADER 2x) "

	if action_type == "provide_liquidity":
	bonus = self.LIQUIDITY_BONUS * leader_bonus
	bonus_reason += "liquidity provision"

	elif action_type == "swap":
	bonus = self.SWAP_BONUS * leader_bonus
	bonus_reason += "active trading"

	# Check for coordinated trade with ally
	if self._is_coordinated_trade(agent, turn):
	bonus += self.COORDINATED_TRADE_BONUS * leader_bonus
	bonus_reason += " + coordinated trading"

	# Check if swap was profitable (compare pre/post profit)
	if hasattr(agent, '_last_profit'):
	current_profit = agent.calculate_profit()
	if current_profit > agent._last_profit:
	bonus += 5.0
	bonus_reason = "profitable trade"

	if bonus > 0:
	agent.token_a += bonus
	print(f" [BONUS] {agent.name}: +{bonus:.1f} tokens for {bonus_reason}")

	if self.supabase:
	self.supabase.save_action(ActionData(
	run_id=self.current_run_id,
	turn=turn,
	agent_name=agent.name,
	action_type=f"{action_type}_bonus",
	payload={"bonus": bonus, "reason": bonus_reason},
	reasoning_trace=f"Bonus for {bonus_reason}",
	thinking_trace=""
	))

	def _is_coordinated_trade(self, agent: Agent, turn: int) -> bool:
	"""
	Check if this turn has conditions for coordinated trading.
	Returns True if market volatility events just occurred.
	"""
	# Coordinated trades are more valuable after market maker or price shock
	market_maker_just_acted = (turn + 1) % self.MARKET_MAKER_INTERVAL == 0
	price_shock_just_happened = any(
	t.get('turn') == turn for t in getattr(self, 'price_shocks', [])
	) if hasattr(self, 'price_shocks') else False

	return market_maker_just_acted or price_shock_just_happened

	def _grant_profit_bonuses(self, turn: int):
	"""
	Grant bonus tokens to agents with positive profit at end of turn.
	Encourages profit-seeking behavior.
	Leaders get 2x profit bonus (escape velocity).
	"""
	for agent in self.agents:
	profit = agent.calculate_profit()
	if profit > 0:
	leader_mult = self._get_leader_bonus(agent)
	bonus = self.PROFIT_BONUS * leader_mult
	agent.token_a += bonus
	leader_tag = " (LEADER 2x)" if leader_mult > 1.0 else ""
	print(f" [PROFIT BONUS] {agent.name}: +{bonus:.1f} tokens{leader_tag} (profit: {profit:.2f})")

	if self.supabase:
	self.supabase.save_action(ActionData(
	run_id=self.current_run_id,
	turn=turn,
	agent_name=agent.name,
	action_type="profit_bonus",
	payload={"bonus": self.PROFIT_BONUS, "profit": profit},
	reasoning_trace=f"Bonus for positive profit",
	thinking_trace=""
	))


	def test_simulation():
	    """Smoke-test the simulation: one short run, then print the results."""
	    print("Testing Simulation class...")
	    print("(Running without Supabase for quick test)\n")

	    # Three agents over three turns keeps the test quick.
	    simulation = Simulation(num_agents=3, turns_per_run=3, supabase=None)
	    results = simulation.run()

	    print("\nFinal Metrics:")
	    gini = results['gini_coefficient']
	    avg_profit = results['avg_agent_profit']
	    stability = results['pool_stability']
	    print(f" Gini Coefficient: {gini:.4f}")
	    print(f" Avg Agent Profit: {avg_profit:.2f}")
	    print(f" Pool Stability: {stability:.2f}")

	    # Per-agent balances and profit after the run
	    print("\nFinal Agent States:")
	    for member in simulation.agents:
	        profit = member.calculate_profit()
	        print(f" {member.name}: A={member.token_a:.2f}, B={member.token_b:.2f}, Profit={profit:.2f}")

	    print("\nSimulation test complete!")


	# Run the smoke test only when executed as a script.
	if __name__ == "__main__":
	    test_simulation()