Spaces:

MGalli
/

AIWorld

Sleeping

App Files Files Community

AIWorld / app.py

MGalli

Update app.py

39762b2 verified 9 days ago

raw

history blame contribute delete

20 kB

	import os
	import json
	import random
	import threading
	import time
	from dataclasses import dataclass, asdict
	from typing import List, Tuple, Dict, Any, Optional

	import gradio as gr
	from transformers import AutoTokenizer, AutoModelForCausalLM


	# ==========================
	# GLOBAL CONFIGURATION
	# ==========================

	# Model loaded at start-up and number of agents spawned by default.
	DEFAULT_MODEL_ID = "Mattimax/DACMini-IT"
	DEFAULT_NUM_AGENTS = 5

	# Output folders: per-agent memory text files and per-agent JSONL logs.
	MEMORY_DIR = "memories"
	LOG_DIR = "logs"

	# Create both folders up front; exist_ok makes repeated imports harmless.
	for _folder in (MEMORY_DIR, LOG_DIR):
	    os.makedirs(_folder, exist_ok=True)

	GRID_SIZE = 10  # the world is a 10x10 grid
	WORLD_SIZE_PX = 480  # side of the rendered SVG, in pixels

	# Simulation state, reassigned at runtime by ui_toggle_run().
	SIMULATION_RUNNING = True
	SIMULATION_DELAY = 1.0  # seconds between one step and the next


	# ==========================
	# CLASSI DI DOMINIO
	# ==========================

	@dataclass
	class Agent:
	    """State of one simulated agent: identity, grid position and running statistics."""

	    agent_id: int
	    name: str
	    role: str
	    interests: str
	    memory_file: str  # path of the text file that append_memory() writes to
	    x: int
	    y: int
	    lifetime_steps: int = 0
	    total_reward: float = 0.0
	    alive: bool = True
	    last_action: str = ""
	    last_reward: float = 0.0

	    def to_dict(self) -> Dict[str, Any]:
	        """Return every field of the agent as a plain dictionary."""
	        snapshot = asdict(self)
	        return snapshot

	    def append_memory(self, text: str):
	        """Append ``text`` followed by a newline to the agent's memory file (UTF-8)."""
	        with open(self.memory_file, mode="a", encoding="utf-8") as memory:
	            memory.writelines([text, "\n"])


	class World:
	    """Grid world that owns the language model and the agent population.

	    Attributes:
	        model_id: identifier passed to ``load_model``.
	        tokenizer, model: the pair returned by ``load_model``.
	        step: number of ticks executed since the last (re)initialisation.
	        agents: current population; slots of dead agents are refilled in place.
	    """

	    # Direction keywords, matched as whole words and checked in this order
	    # (first match wins). Whole-word matching matters: as substrings, "su"
	    # would fire on "sud" and "est" on "questo".
	    _DIRECTION_WORDS = (
	        (("su", "nord"), (0, -1)),
	        (("giu", "giù", "sud"), (0, 1)),
	        (("sinistra", "ovest"), (-1, 0)),
	        (("destra", "est"), (1, 0)),
	    )
	    # Substrings meaning "step towards the closest living agent".
	    _APPROACH_KEYWORDS = ("avvicino", "raggiungo")
	    # Substrings that compute_reward treats as movement/exploration verbs.
	    _MOVEMENT_KEYWORDS = ("cammino", "muovo", "sposto", "avvicino", "raggiungo", "esploro")
	    # Candidate moves for the random walk; the last entry means "stay put".
	    _RANDOM_MOVES = ((1, 0), (-1, 0), (0, 1), (0, -1), (0, 0))

	    def __init__(self, model_id: str = DEFAULT_MODEL_ID, num_agents: int = DEFAULT_NUM_AGENTS):
	        """Load ``model_id`` through ``load_model`` and create ``num_agents`` agents."""
	        self.model_id = model_id
	        self.tokenizer, self.model = load_model(model_id)
	        self.step = 0
	        self.agents: List[Agent] = []
	        self.initialize_agents(num_agents)

	    def initialize_agents(self, num_agents: int):
	        """Replace the population with ``num_agents`` fresh agents and reset the step counter."""
	        # Build the whole list first and publish it with a single assignment,
	        # so code reading self.agents never sees a half-filled population.
	        self.agents = [self._create_random_agent(i) for i in range(num_agents)]
	        self.step = 0

	    def _create_random_agent(self, idx: int) -> Agent:
	        """Create agent ``idx`` with a random identity and a random grid cell.

	        The agent's memory file is opened in write mode, so any previous
	        content stored for the same ``idx`` is discarded.
	        """
	        names = ["Astra", "Nexus", "Orion", "Lyra", "Helix", "Nova", "Echo", "Vega"]
	        roles = ["Ricercatore", "Artista", "Esploratore", "Filosofo", "Ingegnere", "Narratore"]
	        interests = [
	            "intelligenza artificiale, etica, società",
	            "arte generativa, musica, poesia",
	            "esplorazione spaziale, mondi virtuali",
	            "filosofia della mente, coscienza",
	            "robotica, sistemi complessi",
	            "storie, miti, narrazioni collettive",
	        ]

	        name = random.choice(names) + f"_{idx}"
	        role = random.choice(roles)
	        intr = random.choice(interests)

	        memory_file = os.path.join(MEMORY_DIR, f"agent_{idx}.txt")
	        with open(memory_file, "w", encoding="utf-8") as f:
	            f.write(f"Identità dell'agente {name}\n")
	            f.write(f"Ruolo: {role}\n")
	            f.write(f"Interessi: {intr}\n\n")

	        x = random.randint(0, GRID_SIZE - 1)
	        y = random.randint(0, GRID_SIZE - 1)

	        return Agent(
	            agent_id=idx,
	            name=name,
	            role=role,
	            interests=intr,
	            memory_file=memory_file,
	            x=x,
	            y=y,
	        )

	    def reset_world(self, num_agents: int, model_id: str):
	        """Switch to ``model_id`` and start over with ``num_agents`` new agents.

	        The model is loaded before any attribute is touched, so if loading
	        raises, the world keeps its previous model, id and population.
	        """
	        tokenizer, model = load_model(model_id)
	        self.model_id = model_id
	        self.tokenizer, self.model = tokenizer, model
	        self.initialize_agents(num_agents)

	    def step_world(self) -> None:
	        """Run one simulation tick: every living agent generates an action and moves.

	        For each living agent the action is generated, applied to its
	        position, rewarded, written to the memory file and logged. An agent
	        dies when its average reward drops below -0.2 or after more than 80
	        steps; dead agents are replaced by new ones at the end of the tick.
	        """
	        self.step += 1
	        # Bind the list once: initialize_agents() rebinds self.agents, and the
	        # replacement loop below must index the same list it iterated over.
	        agents = self.agents
	        world_state_summary = self._build_world_state_summary()

	        for agent in agents:
	            if not agent.alive:
	                continue

	            action = generate_action(
	                agent=agent,
	                world_state=world_state_summary,
	                tokenizer=self.tokenizer,
	                model=self.model,
	            )

	            self._update_agent_position(agent, action)

	            reward = self.compute_reward(agent, action, world_state_summary)

	            agent.last_action = action
	            agent.last_reward = reward
	            agent.lifetime_steps += 1
	            agent.total_reward += reward

	            # Plain "|" separator: the former "\|" was an invalid escape
	            # sequence that wrote a stray backslash into the memory file.
	            mem_entry = (
	                f"[Step {self.step}] Pos=({agent.x},{agent.y}) "
	                f"Azione: {action} | Reward: {reward:.3f}"
	            )
	            agent.append_memory(mem_entry)

	            self.log_transition(agent, action, reward)

	            avg_reward = agent.total_reward / max(1, agent.lifetime_steps)
	            if avg_reward < -0.2 or agent.lifetime_steps > 80:
	                agent.alive = False

	        # Respawn: a dead agent's slot is reused by a new agent with the same id.
	        for i, agent in enumerate(agents):
	            if not agent.alive:
	                agents[i] = self._create_random_agent(agent.agent_id)

	    def _update_agent_position(self, agent: Agent, action: str):
	        """Move ``agent`` by at most one cell per axis according to ``action``.

	        Resolution order:
	        1. a direction keyword present as a whole word (up/north, down/south,
	           left/west, right/east);
	        2. an approach keyword: step towards the closest living agent;
	        3. otherwise a random walk (which may also stay in place).

	        The resulting position is clamped to the grid.
	        """
	        text = action.lower()
	        # Split on every non-letter so punctuation and apostrophes delimit words.
	        words = set("".join(ch if ch.isalpha() else " " for ch in text).split())

	        move = None
	        for keywords, delta in self._DIRECTION_WORDS:
	            if any(keyword in words for keyword in keywords):
	                move = delta
	                break

	        if move is None and any(keyword in text for keyword in self._APPROACH_KEYWORDS):
	            target = self._closest_agent(agent)
	            if target is not None:
	                # Sign of the offset on each axis: -1, 0 or 1.
	                move = (
	                    (target.x > agent.x) - (target.x < agent.x),
	                    (target.y > agent.y) - (target.y < agent.y),
	                )

	        if move is None:
	            move = random.choice(self._RANDOM_MOVES)

	        dx, dy = move
	        agent.x = max(0, min(GRID_SIZE - 1, agent.x + dx))
	        agent.y = max(0, min(GRID_SIZE - 1, agent.y + dy))

	    def _closest_agent(self, agent: Agent) -> Optional[Agent]:
	        """Return the living agent nearest to ``agent`` (Manhattan distance), or None.

	        Ties go to the agent that appears first in ``self.agents``.
	        """
	        others = [a for a in self.agents if a.agent_id != agent.agent_id and a.alive]
	        return min(
	            others,
	            key=lambda other: abs(other.x - agent.x) + abs(other.y - agent.y),
	            default=None,
	        )

	    def _build_world_state_summary(self) -> str:
	        """Return a multi-line text description of the step counter and every agent."""
	        lines = [f"Step globale: {self.step}", "Stato degli agenti:"]
	        for a in self.agents:
	            status = "vivo" if a.alive else "morto"
	            lines.append(
	                f"- {a.name} ({a.role}), interessi: {a.interests}, "
	                f"posizione: ({a.x},{a.y}), step di vita: {a.lifetime_steps}, "
	                f"reward totale: {a.total_reward:.2f}, stato: {status}"
	            )
	        return "\n".join(lines)

	    def compute_reward(self, agent: Agent, action: str, world_state: str) -> float:
	        """Score ``action`` with three additive rules.

	        * +1.0 if the stripped action has at least 20 characters, else -0.5;
	        * +1.0 if it contains the name of another agent;
	        * +0.5 if it contains a movement/exploration keyword.

	        ``world_state`` is accepted for interface compatibility and is not used.
	        """
	        reward = 1.0 if len(action.strip()) >= 20 else -0.5

	        other_names = [a.name for a in self.agents if a.agent_id != agent.agent_id]
	        if any(name in action for name in other_names):
	            reward += 1.0

	        text = action.lower()
	        if any(keyword in text for keyword in self._MOVEMENT_KEYWORDS):
	            reward += 0.5

	        return reward

	    def log_transition(self, agent: Agent, action: str, reward: float):
	        """Append one JSON line describing this transition to the agent's log file."""
	        log_path = os.path.join(LOG_DIR, f"agent_{agent.agent_id}_log.jsonl")
	        transition = {
	            "step": self.step,
	            "agent_id": agent.agent_id,
	            "name": agent.name,
	            "role": agent.role,
	            "interests": agent.interests,
	            "x": agent.x,
	            "y": agent.y,
	            "action": action,
	            "reward": reward,
	            "lifetime_steps": agent.lifetime_steps,
	            "total_reward": agent.total_reward,
	        }
	        with open(log_path, "a", encoding="utf-8") as f:
	            f.write(json.dumps(transition, ensure_ascii=False) + "\n")


	# ==========================
	# MODELLO LLM
	# ==========================

	# Already-loaded (tokenizer, model) pairs, keyed by model id.
	_model_cache: Dict[str, Tuple[Any, Any]] = {}


	def load_model(model_id: str) -> Tuple[Any, Any]:
	    """Return the ``(tokenizer, model)`` pair for ``model_id``.

	    The pair is loaded with ``from_pretrained`` on first use and served from
	    the module-level cache on every later call with the same id.
	    """
	    try:
	        return _model_cache[model_id]
	    except KeyError:
	        pass  # first request for this id: load it below

	    pair = (
	        AutoTokenizer.from_pretrained(model_id),
	        AutoModelForCausalLM.from_pretrained(model_id),
	    )
	    _model_cache[model_id] = pair
	    return pair


	def build_agent_prompt(agent: Agent, world_state: str) -> str:
	    """Compose the prompt sent to the model for ``agent``.

	    The text contains the agent's name, role and interests, the supplied
	    ``world_state`` and the task instructions. Leading and trailing
	    whitespace is stripped from the result.
	    """
	    return f"""
	Sei un agente in un mondo simulato su una griglia 2D.

	Identità:
	- Nome: {agent.name}
	- Ruolo: {agent.role}
	- Interessi: {agent.interests}

	Stato del mondo:
	{world_state}

	Compito:
	In una sola breve azione (1-3 frasi), descrivi cosa fai ora per interagire con questo mondo
	e con gli altri agenti. Puoi muoverti (su/giù/sinistra/destra), avvicinarti a qualcuno, esplorare, osservare.
	Sii coerente con il tuo ruolo e i tuoi interessi.

	Rispondi SOLO con l'azione, senza spiegazioni meta.
	""".strip()


	def generate_action(agent: Agent, world_state: str, tokenizer, model) -> str:
	    """Sample one action for ``agent`` and return only the newly generated text.

	    Args:
	        agent: agent whose identity goes into the prompt.
	        world_state: textual world description embedded in the prompt.
	        tokenizer: callable tokenizer that also provides ``decode``.
	        model: model exposing ``generate``.

	    Returns:
	        The decoded continuation, stripped of surrounding whitespace.
	    """
	    prompt = build_agent_prompt(agent, world_state)
	    inputs = tokenizer(prompt, return_tensors="pt")
	    outputs = model.generate(
	        **inputs,
	        max_new_tokens=80,
	        do_sample=True,
	        temperature=0.9,
	        top_p=0.95,
	    )
	    # Drop the prompt by token count rather than by comparing decoded text:
	    # decoding does not always reproduce the prompt character for character,
	    # and a failed prefix match would return the whole prompt (direction
	    # words and other agents' names included) as the action.
	    # Assumes generate() returns prompt tokens followed by the continuation,
	    # as decoder-only causal LMs do.
	    prompt_length = inputs["input_ids"].shape[-1]
	    new_tokens = outputs[0][prompt_length:]
	    return tokenizer.decode(new_tokens, skip_special_tokens=True).strip()


	# ==========================
	# RENDERING SVG + HTML
	# ==========================

	def world_to_svg(world: World) -> str:
	    """Render the grid and every agent of ``world`` as one HTML/SVG string.

	    The output is, in order: a script that reloads the page after 1000 ms,
	    the opening ``<svg>`` tag, an embedded stylesheet, the grid lines, and
	    for each agent a translucent halo, a solid node and a name label.
	    Living agents are drawn green, dead ones orange.
	    """
	    size = WORLD_SIZE_PX
	    cell = size // GRID_SIZE

	    # Auto-refresh snippet: reloads the page one second after it is rendered.
	    # NOTE(review): confirm the hosting component actually executes inline scripts.
	    refresh_js = """
	<script>
	if (typeof window !== 'undefined') {
	setTimeout(function() {
	window.location.reload();
	}, 1000);
	}
	</script>
	"""

	    svg_open = (
	        f'<svg width="{size}" height="{size}" viewBox="0 0 {size} {size}" '
	        f'style="background:radial-gradient(circle at top,#0f172a,#020617);'
	        f'border-radius:16px;border:1px solid #1f2937;box-shadow:0 18px 40px rgba(15,23,42,0.9);" '
	        f'xmlns="http://www.w3.org/2000/svg">'
	    )

	    stylesheet = """
	<style>
	.cell-line {
	stroke: #1f2937;
	stroke-width: 1;
	}
	.agent-node {
	stroke: #e5e7eb;
	stroke-width: 2;
	animation: pulse 2.4s ease-in-out infinite;
	}
	.agent-label {
	font-family: system-ui, -apple-system, BlinkMacSystemFont, "Segoe UI", sans-serif;
	font-size: 10px;
	fill: #e5e7eb;
	text-shadow: 0 0 4px rgba(15,23,42,0.9);
	}
	@keyframes pulse {
	0% { r: 0; opacity: 0; }
	30% { r: 6; opacity: 0.8; }
	100% { r: 10; opacity: 0; }
	}
	</style>
	"""

	    parts = [refresh_js, svg_open, stylesheet]

	    # Grid: one vertical and one horizontal line per cell boundary.
	    for index in range(GRID_SIZE + 1):
	        offset = index * cell
	        parts += [
	            f'<line x1="{offset}" y1="0" x2="{offset}" y2="{size}" class="cell-line" />',
	            f'<line x1="0" y1="{offset}" x2="{size}" y2="{offset}" class="cell-line" />',
	        ]

	    for agent in world.agents:
	        # Centre of the agent's cell, in pixels.
	        cx = agent.x * cell + cell / 2
	        cy = agent.y * cell + cell / 2

	        if agent.alive:
	            base_color = "#22c55e"
	        else:
	            base_color = "#f97316"

	        halo = (
	            f'<circle cx="{cx}" cy="{cy}" r="{cell*0.35}" fill="{base_color}" '
	            f'fill-opacity="0.25" />'
	        )
	        node = (
	            f'<circle cx="{cx}" cy="{cy}" r="{cell*0.22}" fill="{base_color}" '
	            f'class="agent-node" />'
	        )
	        label = (
	            f'<text x="{cx}" y="{cy + cell*0.4}" text-anchor="middle" class="agent-label">'
	            f'{agent.name}</text>'
	        )
	        parts.extend((halo, node, label))

	    parts.append("</svg>")
	    return "".join(parts)


	def world_to_html_cards(world: World) -> str:
	    """Render the world header and one detail card per agent as an HTML string.

	    Every dynamic text value (model id, agent name, role, interests and last
	    action) is HTML-escaped before interpolation: the last action is
	    model-generated text and the model id is typed by the user, so either
	    could otherwise inject markup into the page.

	    Returns:
	        The stylesheet, the header and the cards grid, concatenated.
	    """
	    from html import escape

	    css = """
	<style>
	body {
	font-family: system-ui, -apple-system, BlinkMacSystemFont, "Segoe UI", sans-serif;
	background: transparent;
	color: #f5f5f5;
	margin: 0;
	padding: 0;
	}
	.world-header {
	display: flex;
	justify-content: space-between;
	align-items: baseline;
	margin-bottom: 8px;
	}
	.world-title {
	font-size: 18px;
	font-weight: 600;
	}
	.world-subtitle {
	font-size: 12px;
	color: #a0aec0;
	}
	.agents-grid {
	display: grid;
	grid-template-columns: repeat(auto-fill, minmax(260px, 1fr));
	gap: 10px;
	}
	.agent-card {
	background: radial-gradient(circle at top left, #1f2937, #020617);
	border-radius: 10px;
	padding: 10px 12px;
	border: 1px solid rgba(148, 163, 184, 0.35);
	box-shadow: 0 8px 20px rgba(15, 23, 42, 0.8);
	}
	.agent-header {
	display: flex;
	justify-content: space-between;
	align-items: center;
	margin-bottom: 6px;
	}
	.agent-name {
	font-size: 16px;
	font-weight: 600;
	}
	.agent-role {
	font-size: 11px;
	color: #93c5fd;
	text-transform: uppercase;
	letter-spacing: 0.06em;
	}
	.agent-badge {
	padding: 3px 7px;
	border-radius: 999px;
	font-size: 10px;
	font-weight: 500;
	}
	.badge-alive {
	background: rgba(16, 185, 129, 0.15);
	color: #6ee7b7;
	border: 1px solid rgba(16, 185, 129, 0.6);
	}
	.badge-dead {
	background: rgba(248, 113, 113, 0.15);
	color: #fecaca;
	border: 1px solid rgba(248, 113, 113, 0.6);
	}
	.agent-meta {
	font-size: 11px;
	color: #e5e7eb;
	margin-bottom: 6px;
	}
	.agent-meta span {
	display: inline-block;
	margin-right: 8px;
	}
	.agent-interests {
	font-size: 11px;
	color: #9ca3af;
	margin-bottom: 6px;
	}
	.agent-action {
	font-size: 12px;
	color: #e5e7eb;
	background: rgba(15, 23, 42, 0.7);
	border-radius: 8px;
	padding: 6px;
	border: 1px solid rgba(55, 65, 81, 0.8);
	min-height: 32px;
	}
	.agent-action-label {
	font-size: 10px;
	text-transform: uppercase;
	letter-spacing: 0.08em;
	color: #9ca3af;
	margin-bottom: 3px;
	}
	</style>
	"""

	    model_label = escape(str(world.model_id))
	    header = f"""
	<div class="world-header">
	<div>
	<div class="world-title">Mondo Simulato – Step {world.step}</div>
	<div class="world-subtitle">
	Modello: <code>{model_label}</code> · Agenti: {len(world.agents)}
	</div>
	</div>
	</div>
	"""

	    cards = []
	    for agent in world.agents:
	        badge_class = "badge-alive" if agent.alive else "badge-dead"
	        badge_text = "Vivo" if agent.alive else "Rinascita in corso"
	        avg_reward = agent.total_reward / max(1, agent.lifetime_steps)

	        name = escape(agent.name)
	        role = escape(agent.role)
	        interests = escape(agent.interests)
	        # The placeholder is trusted markup; only real action text is escaped.
	        if agent.last_action:
	            action_html = escape(agent.last_action)
	        else:
	            action_html = "<i>Nessuna azione ancora.</i>"

	        card = f"""
	<div class="agent-card">
	<div class="agent-header">
	<div>
	<div class="agent-name">{name}</div>
	<div class="agent-role">{role}</div>
	</div>
	<div class="agent-badge {badge_class}">{badge_text}</div>
	</div>
	<div class="agent-meta">
	<span>Pos: <strong>({agent.x},{agent.y})</strong></span>
	<span>Step vita: <strong>{agent.lifetime_steps}</strong></span>
	<span>Reward tot: <strong>{agent.total_reward:.2f}</strong></span>
	<span>Reward medio: <strong>{avg_reward:.2f}</strong></span>
	</div>
	<div class="agent-interests">
	<strong>Interessi:</strong> {interests}
	</div>
	<div class="agent-action">
	<div class="agent-action-label">Ultima azione</div>
	<div>{action_html}</div>
	</div>
	</div>
	"""
	        cards.append(card)

	    grid = f'<div class="agents-grid">{"".join(cards)}</div>'

	    return css + header + grid


	# ==========================
	# STATE & SIMULATION
	# ==========================

	# Single world instance shared by the simulation loop and the UI callbacks.
	# Building it loads DEFAULT_MODEL_ID (World.__init__ calls load_model).
	GLOBAL_WORLD: World = World(model_id=DEFAULT_MODEL_ID, num_agents=DEFAULT_NUM_AGENTS)


	def simulation_loop():
	    """Advance the shared world forever; never returns.

	    Each iteration runs one ``step_world()`` when ``SIMULATION_RUNNING`` is
	    true, then sleeps for ``SIMULATION_DELAY`` seconds (at least 0.1 s).
	    Both flags are re-read on every iteration.
	    """
	    import traceback

	    while True:
	        if SIMULATION_RUNNING:
	            try:
	                GLOBAL_WORLD.step_world()
	            except Exception:
	                # Top-level boundary of the loop: report the failure and keep
	                # going, otherwise one failing step would end the loop for good.
	                traceback.print_exc()
	        time.sleep(max(0.1, SIMULATION_DELAY))


	def serialize_world(world: World) -> dict:
	    """Return a plain-dict snapshot of ``world``: model id, step counter and agents."""
	    agent_dicts = [agent.to_dict() for agent in world.agents]
	    return dict(model_id=world.model_id, step=world.step, agents=agent_dicts)


	# ==========================
	# FUNZIONI GRADIO
	# ==========================

	def ui_refresh():
	    """Render the shared world and return ``(svg, html_cards, state)`` for the UI outputs."""
	    world = GLOBAL_WORLD
	    return (
	        world_to_svg(world),
	        world_to_html_cards(world),
	        serialize_world(world),
	    )


	def ui_reset(model_id: str, num_agents: int):
	    """Reset the shared world with the chosen model and agent count, then re-render.

	    Args:
	        model_id: model identifier typed by the user; surrounding whitespace
	            is removed before it is used.
	        num_agents: requested population size; coerced to ``int`` because the
	            world passes it to ``range()``.

	    Returns:
	        The same ``(svg, html_cards, state)`` tuple as ``ui_refresh()``.
	    """
	    GLOBAL_WORLD.reset_world(num_agents=int(num_agents), model_id=model_id.strip())
	    return ui_refresh()


	def ui_toggle_run(run: bool, delay: float):
	    """Store the run flag and step delay in the module globals and return a status line."""
	    global SIMULATION_RUNNING, SIMULATION_DELAY
	    SIMULATION_RUNNING, SIMULATION_DELAY = run, delay

	    if run:
	        label = "ON"
	    else:
	        label = "PAUSA"
	    return f"Simulazione: {label} · Delay: {delay:.2f}s"


	# ==========================
	# COSTRUZIONE INTERFACCIA
	# ==========================

	# Interface layout: controls on the left, world view and agent cards on the right.
	with gr.Blocks(title="AIWorld – Conway-Like LLM Life") as demo:
	    gr.Markdown(
	        """
	# 🏆 AIWorld – Conway-Like LLM Life

	Un piccolo mondo simulato dove agenti LLM:
	- vivono su una griglia 2D,
	- hanno identità, ruoli, interessi e memoria,
	- generano azioni testuali,
	- si muovono nello spazio,
	- ricevono un reward semplice,
	- possono "morire" e rinascere con nuove identità.

	La simulazione gira in background in modo continuo.
	La vista si aggiorna automaticamente ogni ~1 secondo.
	"""
	    )

	    with gr.Row():
	        with gr.Column(scale=1):
	            model_id_in = gr.Textbox(
	                label="Modello Hugging Face",
	                value=DEFAULT_MODEL_ID,
	                info="Esempio: Mattimax/DACMini-IT",
	            )
	            num_agents_in = gr.Slider(
	                label="Numero di agenti",
	                minimum=1,
	                maximum=30,
	                step=1,
	                value=DEFAULT_NUM_AGENTS,
	            )
	            reset_btn = gr.Button("Reset mondo", variant="primary")

	            run_toggle = gr.Checkbox(
	                label="Simulazione in esecuzione",
	                value=True,
	            )
	            delay_slider = gr.Slider(
	                label="Delay tra step (secondi)",
	                minimum=0.2,
	                maximum=5.0,
	                step=0.2,
	                value=SIMULATION_DELAY,
	            )
	            status_text = gr.Markdown("Simulazione: ON")

	        with gr.Column(scale=2):
	            svg_out = gr.HTML(label="Mondo fisico (griglia)")
	            html_out = gr.HTML(label="Dettagli agenti")
	            state_out = gr.State(serialize_world(GLOBAL_WORLD))

	    view_outputs = [svg_out, html_out, state_out]

	    reset_btn.click(
	        fn=ui_reset,
	        inputs=[model_id_in, num_agents_in],
	        outputs=view_outputs,
	    )

	    # The checkbox and the delay slider share one handler: either change
	    # re-applies both values.
	    run_toggle.change(
	        fn=ui_toggle_run,
	        inputs=[run_toggle, delay_slider],
	        outputs=[status_text],
	    )

	    delay_slider.change(
	        fn=ui_toggle_run,
	        inputs=[run_toggle, delay_slider],
	        outputs=[status_text],
	    )

	    # Fill the world view and the cards as soon as a page opens; without this
	    # both panes stay empty until "Reset mondo" is clicked.
	    demo.load(fn=ui_refresh, outputs=view_outputs)

	    # Periodic refresh through Gradio itself. gr.Timer is not available in
	    # every Gradio release, hence the guard.
	    if hasattr(gr, "Timer"):
	        gr.Timer(1.0).tick(fn=ui_refresh, outputs=view_outputs)

	# Start the simulation loop on a background daemon thread.
	_simulation_thread = threading.Thread(target=simulation_loop, daemon=True)
	_simulation_thread.start()

	if __name__ == "__main__":
	    demo.launch()