#!/usr/bin/env python3
# -*- coding: utf-8 -*-
"""
Play Catan with AI Agents (Manual Mode)
---------------------------------------
This script starts a Catan game where AI agents generate prompts
but YOU enter their moves manually. This is useful for:
- Testing the AI prompt system
- Understanding what the AI "sees"
- Debugging AI decision making
- Training data collection
How it works:
1. AI agents are registered for each player
2. When it's an AI player's turn, a prompt is generated and saved
3. You see the prompt info and enter what action the AI should take
4. The game executes that action
All prompts and interactions are logged for later analysis.
Usage:
python examples/ai_testing/play_with_ai.py
# Or with options:
python examples/ai_testing/play_with_ai.py --players 3 --auto-llm
"""
import sys
import os
import ssl
import json
import html as html_lib
from pathlib import Path
# Fix SSL certificate verification on Windows (must be before any other imports)
try:
import certifi
os.environ['SSL_CERT_FILE'] = certifi.where()
os.environ['REQUESTS_CA_BUNDLE'] = certifi.where()
os.environ['GRPC_DEFAULT_SSL_ROOTS_FILE_PATH'] = certifi.where()
ssl._create_default_https_context = ssl._create_unverified_context
except Exception:
pass
# Add parent directories to path for imports
sys.path.insert(0, str(Path(__file__).parent.parent.parent))
from typing import List, Optional, Dict, Any, Set
import webbrowser
import threading
import time
from http.server import BaseHTTPRequestHandler, ThreadingHTTPServer
from urllib.parse import parse_qs, urlparse
from pycatan.management.game_manager import GameManager
from pycatan.players.human_user import HumanUser
from pycatan.ai import AIManager, AIUser, AIConfig
from pycatan.ai.config import normalize_chat_language
from pycatan.visualizations.web_visualization import WebVisualization
from pycatan.visualizations.visualization import VisualizationManager
# Configure stdout for UTF-8 on Windows
import sys
import io
if sys.platform == 'win32':
sys.stdout = io.TextIOWrapper(sys.stdout.buffer, encoding='utf-8', errors='replace')
LOGS_DIR = Path("examples") / "ai_testing" / "my_games"
GEMINI_TEXT_MODELS = [
{
"id": "gemini-3-flash-preview",
"label": "Gemini 3 Flash Preview",
"note": "Recommended for this game: fast, capable, supports tools and structured JSON.",
},
{
"id": "gemini-3.1-pro-preview",
"label": "Gemini 3.1 Pro Preview",
"note": "Highest reasoning option; slower and usually more expensive.",
},
{
"id": "gemini-3.1-flash-lite",
"label": "Gemini 3.1 Flash-Lite",
"note": "Stable low-latency option for cheaper runs.",
},
{
"id": "gemini-3.1-flash-lite-preview",
"label": "Gemini 3.1 Flash-Lite Preview",
"note": "Preview low-latency option with structured output support.",
},
{
"id": "gemini-2.5-flash",
"label": "Gemini 2.5 Flash",
"note": "Stable price-performance model with tools and structured output.",
},
{
"id": "gemini-2.5-pro",
"label": "Gemini 2.5 Pro",
"note": "Stable stronger reasoning model.",
},
{
"id": "gemini-2.5-flash-lite",
"label": "Gemini 2.5 Flash-Lite",
"note": "Stable budget model.",
},
]
ELEVENLABS_TTS_MODELS = [
{
"id": "eleven_v3",
"label": "Eleven v3",
"note": "Best quality and Hebrew support; recommended for natural Hebrew table talk.",
},
{
"id": "eleven_multilingual_v2",
"label": "Eleven Multilingual v2",
"note": "Good multilingual quality; useful fallback if v3 is too slow or inconsistent.",
},
{
"id": "eleven_flash_v2_5",
"label": "Eleven Flash v2.5",
"note": "Fast and cheaper; best if you switch table talk back to English or another supported v2.5 language.",
},
{
"id": "eleven_turbo_v2_5",
"label": "Eleven Turbo v2.5",
"note": "Low-latency quality/speed balance; useful fallback for supported languages.",
},
]
DEFAULT_PLAYER_NAMES = ["Alice", "Bob", "Charlie", "Diana"]
PLAYER_COLORS = ["Red", "Blue", "White", "Orange"]
def resolve_session_path(session_ref: str) -> Path:
"""Resolve a replay session name/path."""
path = Path(session_ref)
if path.is_absolute() and path.exists():
return path
if path.exists():
return path
session_path = LOGS_DIR / session_ref
if session_path.exists():
return session_path
raise FileNotFoundError(f"Replay session not found: {session_ref}")
def _parse_replay_marker(value: Optional[str]) -> Optional[tuple[str, int]]:
"""Parse a replay marker in the form Player:request_number."""
if not value:
return None
if ":" not in value:
raise ValueError("Replay marker must be in the form Player:request_number")
player, request_number = value.split(":", 1)
return player.strip(), int(request_number.strip())
def _marker_matches(decision: Dict[str, Any], marker: tuple[str, int]) -> bool:
player_name, request_number = marker
return (
decision["player_name"].lower() == player_name.lower()
and decision["request_number"] == request_number
)
def _first_response_timestamp(player_dir: Path) -> str:
responses_dir = player_dir / "responses"
if not responses_dir.exists():
return ""
timestamps = []
for response_file in responses_dir.glob("response_*.json"):
try:
data = json.loads(response_file.read_text(encoding="utf-8"))
except Exception:
continue
if data.get("timestamp"):
timestamps.append(str(data["timestamp"]))
return min(timestamps) if timestamps else ""
def infer_players_from_session(session_dir: Path, _visited: Optional[Set[str]] = None) -> List[str]:
"""Infer player names from session folders, preserving original turn order when possible."""
_visited = _visited or set()
session_key = str(session_dir.resolve())
if session_key in _visited:
return []
_visited.add(session_key)
ignored = {"prompts", "responses", "intermediate"}
players = []
for child in sorted(session_dir.iterdir(), key=lambda p: p.name.lower()):
if child.is_dir() and child.name not in ignored:
if (child / "responses").exists() or (child / "prompts").exists():
players.append((child.name, _first_response_timestamp(child)))
# In setup, first response order is the player order. Fall back to name order for
# empty/incomplete folders.
players.sort(key=lambda item: (item[1] == "", item[1], item[0].lower()))
local_inferred = [name for name, _timestamp in players]
parent_inferred: List[str] = []
metadata_file = session_dir / "session_metadata.json"
if metadata_file.exists():
try:
metadata = json.loads(metadata_file.read_text(encoding="utf-8"))
except Exception:
metadata = {}
derived_from = metadata.get("derived_from")
if derived_from:
try:
parent_inferred = infer_players_from_session(resolve_session_path(derived_from), _visited)
except Exception:
parent_inferred = []
if parent_inferred:
merged = list(parent_inferred)
seen = {name.lower() for name in merged}
for name in local_inferred:
if name.lower() not in seen:
merged.append(name)
seen.add(name.lower())
return merged
return local_inferred
def infer_players_from_decisions(decisions: List[Dict[str, Any]]) -> List[str]:
"""Infer player names from loaded replay decisions when session folders are absent."""
players: List[str] = []
seen = set()
for decision in decisions:
player_name = decision.get("player_name")
if player_name and player_name.lower() not in seen:
players.append(player_name)
seen.add(player_name.lower())
return players
def load_replay_decisions(
session_dir: Path,
max_decisions: Optional[int] = None,
replay_through: Optional[str] = None,
replay_stop_before: Optional[str] = None
) -> List[Dict[str, Any]]:
"""Load parsed final responses from a previous session in chronological order."""
through_marker = _parse_replay_marker(replay_through)
stop_before_marker = _parse_replay_marker(replay_stop_before)
decisions = []
for player_dir in session_dir.iterdir():
responses_dir = player_dir / "responses"
if not responses_dir.exists():
continue
for response_file in responses_dir.glob("response_*.json"):
if response_file.parent.name == "intermediate":
continue
try:
data = json.loads(response_file.read_text(encoding="utf-8"))
except Exception:
continue
parsed = data.get("parsed")
if not parsed or not parsed.get("action_type"):
continue
decisions.append({
"player_name": data.get("player_name") or player_dir.name,
"request_number": int(data.get("request_number", 0)),
"timestamp": data.get("timestamp", ""),
"parsed": parsed,
"source_file": str(response_file),
})
decisions.sort(key=lambda item: (item.get("timestamp", ""), item.get("player_name", ""), item.get("request_number", 0)))
for marker_name, marker in [("replay-through", through_marker), ("replay-stop-before", stop_before_marker)]:
if marker and not any(_marker_matches(decision, marker) for decision in decisions):
raise ValueError(
f"{marker_name} marker not found in session: {marker[0]}:{marker[1]}"
)
selected = []
for decision in decisions:
if stop_before_marker and _marker_matches(decision, stop_before_marker):
break
selected.append(decision)
if through_marker and _marker_matches(decision, through_marker):
break
if max_decisions and len(selected) >= max_decisions:
break
return selected
def load_replay_decision_chain(
session_dir: Path,
max_decisions: Optional[int] = None,
replay_through: Optional[str] = None,
replay_stop_before: Optional[str] = None,
_visited: Optional[Set[str]] = None
) -> List[Dict[str, Any]]:
"""
Load replay decisions needed to reconstruct a session.
Derived sessions only contain the live decisions made after their own replay
prefix. To replay from a derived session, first replay its lineage metadata,
then append this session's local decisions.
"""
_visited = _visited or set()
session_key = str(session_dir.resolve())
if session_key in _visited:
raise ValueError(f"Replay lineage cycle detected at {session_dir}")
_visited.add(session_key)
prefix: List[Dict[str, Any]] = []
metadata_file = session_dir / "session_metadata.json"
if metadata_file.exists():
try:
metadata = json.loads(metadata_file.read_text(encoding="utf-8"))
except Exception:
metadata = {}
derived_from = metadata.get("derived_from")
replay_meta = metadata.get("replay") or {}
if derived_from:
parent_session = resolve_session_path(derived_from)
prefix = load_replay_decision_chain(
parent_session,
replay_through=replay_meta.get("replay_through"),
replay_stop_before=replay_meta.get("replay_stop_before"),
_visited=_visited
)
local = load_replay_decisions(
session_dir,
replay_through=replay_through,
replay_stop_before=replay_stop_before
)
decisions = prefix + local
if max_decisions:
decisions = decisions[:max_decisions]
return decisions
def group_replay_decisions(decisions: List[Dict[str, Any]]) -> Dict[str, List[Dict[str, Any]]]:
"""Group replay decisions by player, preserving chronological order per player."""
grouped: Dict[str, List[Dict[str, Any]]] = {}
for decision in decisions:
grouped.setdefault(decision["player_name"], []).append(decision)
return grouped
def list_replay_marker_options(session_dir: Path) -> List[Dict[str, str]]:
"""Return replay markers that are valid for this selected session."""
options = []
for decision in load_replay_decisions(session_dir):
marker = f"{decision['player_name']}:{decision['request_number']}"
action_type = decision.get("parsed", {}).get("action_type", "")
options.append({
"value": marker,
"label": f"{marker} - {action_type}",
"action_type": action_type,
})
return options
class ReplayExhausted(Exception):
"""Raised by watch-only replay when no recorded decision exists."""
def annotate_replay_session(
ai_manager: AIManager,
source_session: Path,
decisions: List[Dict[str, Any]],
replay_through: Optional[str],
replay_stop_before: Optional[str],
mode: str = "fast_action_replay_then_live_ai"
) -> None:
"""Write lineage metadata into the newly created session."""
metadata_file = ai_manager.get_session_path() / "session_metadata.json"
metadata = {}
if metadata_file.exists():
metadata = json.loads(metadata_file.read_text(encoding="utf-8"))
metadata["derived_from"] = str(source_session)
metadata["replay"] = {
"source_session": source_session.name,
"decisions_loaded": len(decisions),
"replay_through": replay_through,
"replay_stop_before": replay_stop_before,
"mode": mode,
}
metadata_file.write_text(json.dumps(metadata, indent=2, ensure_ascii=False), encoding="utf-8")
class ReplayAIUser(AIUser):
"""AI user that first replays recorded parsed decisions, then falls back to live AI."""
def __init__(
self,
name: str,
user_id: int,
ai_manager: AIManager,
color: str = "",
replay_decisions: Optional[List[Dict[str, Any]]] = None,
replay_chat: bool = True,
replay_speak: bool = False,
replay_only: bool = False
):
super().__init__(name=name, user_id=user_id, ai_manager=ai_manager, color=color)
self.replay_decisions = list(replay_decisions or [])
self.replay_chat = replay_chat
self.replay_speak = replay_speak
self.replay_only = replay_only
self.last_replay_item: Optional[Dict[str, Any]] = None
def get_input(self, game_state, prompt_message: str, allowed_actions: Optional[List[str]] = None):
if self.replay_decisions:
replay_item = self.replay_decisions[0]
decision = dict(replay_item["parsed"])
action = self._decision_to_action(decision, allowed_actions)
if hasattr(action, "parameters") and isinstance(action.parameters, dict):
action.parameters.pop("_ai_say_outloud", None)
action.parameters["_ai_replay"] = True
if allowed_actions and action.action_type.name not in allowed_actions:
if self.replay_only:
raise ReplayExhausted(
f"{self.name} #{replay_item['request_number']} no longer matches "
f"allowed actions {allowed_actions}"
)
print(
f"[REPLAY] {self.name} #{replay_item['request_number']} no longer matches "
f"allowed actions {allowed_actions}; switching {self.name} to live AI."
)
self.replay_decisions.clear()
return super().get_input(game_state, prompt_message, allowed_actions)
self.last_replay_item = self.replay_decisions.pop(0)
self._apply_replay_memory_and_chat(decision, game_state)
print(
f"[REPLAY] {self.name} #{replay_item['request_number']}: "
f"{decision.get('action_type')} {decision.get('parameters', {})}"
)
return action
if self.replay_only:
raise ReplayExhausted(f"No more recorded replay decisions for {self.name}")
return super().get_input(game_state, prompt_message, allowed_actions)
def _apply_replay_memory_and_chat(
self,
decision: Dict[str, Any],
game_state: Optional[Dict[str, Any]] = None
) -> None:
agent = self.ai_manager.agents.get(self.name)
note_to_self = decision.get("note_to_self")
if agent and note_to_self:
agent.update_memory(note_to_self)
self.ai_manager._maybe_compact_agent_memory(agent, game_state)
self.ai_manager.logger.save_agent_memories(self.ai_manager.agents)
say_outloud = decision.get("say_outloud")
if self.replay_chat and say_outloud:
self.ai_manager._broadcast_chat(
self.name,
say_outloud,
speak=self.replay_speak
)
def load_env_file(env_path: Path = Path(".env")) -> None:
"""Load simple KEY=VALUE entries from .env without requiring python-dotenv."""
if not env_path.exists():
return
for raw_line in env_path.read_text(encoding="utf-8").splitlines():
line = raw_line.strip()
if not line or line.startswith("#") or "=" not in line:
continue
key, value = line.split("=", 1)
key = key.strip()
value = value.strip().strip('"').strip("'")
if key and key not in os.environ:
os.environ[key] = value
def load_ai_config(config_path: Optional[str] = None) -> AIConfig:
"""Load explicit config, then config_dev.yaml, then defaults."""
if config_path:
return AIConfig.from_file(config_path)
default_config = Path("pycatan") / "ai" / "config_dev.yaml"
if default_config.exists():
return AIConfig.from_file(str(default_config))
return AIConfig()
def _render_browser_settings_page(
errors: Optional[List[str]] = None,
selected_model: str = "gemini-3-flash-preview",
selected_chat_language: str = "english",
selected_tts_provider: str = "gemini",
selected_tts_model: str = "eleven_v3",
selected_gemini_tts_model: str = "gemini-2.5-flash-preview-tts",
selected_gemini_tts_voice: str = "Kore",
player_count: int = 3,
player_names: Optional[List[str]] = None,
selected_run_mode: str = "new_game",
selected_replay_session: str = "",
selected_replay_max_decisions: str = "",
selected_replay_through: str = "",
selected_replay_stop_before: str = "",
selected_replay_skip_chat: bool = False,
selected_replay_delay: str = "2.5",
selected_replay_text_lead: str = "0.25",
selected_replay_speak: bool = False,
selected_no_llm: bool = False,
selected_reaction_mode: str = "default",
selected_reaction_batch_size: str = "",
selected_config_path: str = "",
selected_random_seed: str = "",
selected_game_context: str = "",
key_mode: str = "env",
gemini_env_available: bool = False,
elevenlabs_env_available: bool = False,
elevenlabs_voice_env_available: bool = False
) -> str:
"""Render the temporary browser setup form."""
player_names = player_names or DEFAULT_PLAYER_NAMES
errors_html = ""
if errors:
error_items = "".join(f"
{html_lib.escape(error)}
" for error in errors)
errors_html = f"
{error_items}
"
use_env_keys = key_mode == "env"
gemini_key_required = "" if use_env_keys and gemini_env_available else " required"
elevenlabs_key_required = "" if use_env_keys and elevenlabs_env_available else " required"
elevenlabs_voice_required = "" if use_env_keys and elevenlabs_voice_env_available else " required"
gemini_key_hint = (
"Using GEMINI_API_KEY from environment if this is left blank."
if use_env_keys and gemini_env_available
else "Enter a Gemini API key for this run."
)
elevenlabs_key_hint = (
"Using ELEVENLABS_API_KEY from environment if this is left blank."
if use_env_keys and elevenlabs_env_available
else "Enter an ElevenLabs API key when ElevenLabs voice is selected."
)
elevenlabs_voice_hint = (
"Using ELEVENLABS_DEFAULT_VOICE_ID from environment if this is left blank."
if use_env_keys and elevenlabs_voice_env_available
else "Enter the default ElevenLabs voice ID for this run."
)
key_mode_label = "Environment keys" if use_env_keys else "Ask for keys"
recent_session_options = []
if LOGS_DIR.exists():
recent_sessions = sorted(
[path.name for path in LOGS_DIR.iterdir() if path.is_dir() and path.name.startswith("session_")],
reverse=True
)[:30]
recent_session_options = [
f""
for session_name in recent_sessions
]
model_options = []
for model in GEMINI_TEXT_MODELS:
selected = " selected" if model["id"] == selected_model else ""
model_options.append(
f""
)
model_notes = "".join(
"
"
for model in GEMINI_TEXT_MODELS
)
tts_model_options = []
for model in ELEVENLABS_TTS_MODELS:
selected = " selected" if model["id"] == selected_tts_model else ""
tts_model_options.append(
f""
)
tts_model_notes = "".join(
"
"
for model in ELEVENLABS_TTS_MODELS
)
gemini_tts_models = [
"gemini-2.5-flash-preview-tts",
"gemini-2.5-pro-preview-tts",
"gemini-3.1-flash-tts-preview",
"gemini-3.1-pro-tts-preview",
]
gemini_tts_model_options = []
for model_id in gemini_tts_models:
selected = " selected" if model_id == selected_gemini_tts_model else ""
gemini_tts_model_options.append(
f""
)
gemini_tts_voices = [
"Kore", "Puck", "Zephyr", "Charon", "Fenrir", "Leda", "Orus",
"Aoede", "Callirrhoe", "Autonoe", "Enceladus", "Iapetus",
"Umbriel", "Algieba", "Despina", "Erinome", "Algenib",
"Rasalgethi", "Laomedeia", "Achernar", "Alnilam", "Schedar",
"Gacrux", "Pulcherrima", "Achird", "Zubenelgenubi",
"Vindemiatrix", "Sadachbia", "Sadaltager", "Sulafat",
]
gemini_tts_voice_options = []
for voice in gemini_tts_voices:
selected = " selected" if voice == selected_gemini_tts_voice else ""
gemini_tts_voice_options.append(
f""
)
player_inputs = []
for index in range(4):
value = player_names[index] if index < len(player_names) and player_names[index] else DEFAULT_PLAYER_NAMES[index]
player_inputs.append(
f"""
"""
)
return f"""
PyCatan AI Setup
PyCatan AI Setup
Choose the Gemini model, configure keys, then set the AI players for this run.
Key mode: {html_lib.escape(key_mode_label)}
{errors_html}
"""
def _render_game_starting_page(model: str, player_names: List[str]) -> bytes:
"""Render the post-submit page while the real game server starts."""
safe_model = html_lib.escape(model)
safe_players = html_lib.escape(", ".join(player_names))
return f"""
Starting PyCatan
Starting game...
Model: {safe_model}
Players: {safe_players}
The board will open here as soon as the game server is ready.
""".encode("utf-8")
def collect_browser_settings(port: int = 5000, key_mode: str = "env") -> Dict[str, Any]:
"""Open a temporary localhost setup page and wait for the selected run settings."""
settings: Dict[str, Any] = {}
settings_ready = threading.Event()
valid_models = {model["id"] for model in GEMINI_TEXT_MODELS}
valid_chat_languages = {"english", "hebrew"}
valid_tts_models = {model["id"] for model in ELEVENLABS_TTS_MODELS}
valid_tts_providers = {"off", "gemini", "elevenlabs"}
valid_run_modes = {"new_game", "resume_session", "watch_replay", "analyse_game"}
valid_reaction_modes = {"default", "off", "sync", "async"}
valid_gemini_tts_models = {
"gemini-2.5-flash-preview-tts",
"gemini-2.5-pro-preview-tts",
"gemini-3.1-flash-tts-preview",
"gemini-3.1-pro-tts-preview",
}
use_env_keys = key_mode == "env"
def env_has(name: str) -> bool:
return bool(os.environ.get(name))
def render_settings_page(**kwargs) -> str:
return _render_browser_settings_page(
key_mode=key_mode,
gemini_env_available=env_has("GEMINI_API_KEY"),
elevenlabs_env_available=env_has("ELEVENLABS_API_KEY"),
elevenlabs_voice_env_available=env_has("ELEVENLABS_DEFAULT_VOICE_ID"),
**kwargs
)
class ReusableThreadingHTTPServer(ThreadingHTTPServer):
allow_reuse_address = True
class SettingsHandler(BaseHTTPRequestHandler):
def log_message(self, format, *args):
return
def _send_html(self, body: Any, status: int = 200) -> None:
body_bytes = body if isinstance(body, bytes) else body.encode("utf-8")
self.send_response(status)
self.send_header("Content-Type", "text/html; charset=utf-8")
self.send_header("Content-Length", str(len(body_bytes)))
self.end_headers()
self.wfile.write(body_bytes)
def _send_json(self, payload: Dict[str, Any], status: int = 200) -> None:
body_bytes = json.dumps(payload).encode("utf-8")
self.send_response(status)
self.send_header("Content-Type", "application/json; charset=utf-8")
self.send_header("Content-Length", str(len(body_bytes)))
self.end_headers()
self.wfile.write(body_bytes)
def do_GET(self):
parsed_url = urlparse(self.path)
if parsed_url.path == "/replay-markers":
query = parse_qs(parsed_url.query)
session_ref = query.get("session", [""])[0].strip()
if not session_ref:
self._send_json({"markers": []})
return
try:
session_dir = resolve_session_path(session_ref)
markers = list_replay_marker_options(session_dir)
except Exception as exc:
self._send_json({"error": str(exc), "markers": []}, status=400)
return
self._send_json({"markers": markers})
return
if parsed_url.path not in ("/", "/settings"):
self.send_response(302)
self.send_header("Location", "/settings")
self.end_headers()
return
self._send_html(render_settings_page())
def do_POST(self):
if self.path != "/start":
self.send_error(404)
return
length = int(self.headers.get("Content-Length", "0"))
fields = parse_qs(self.rfile.read(length).decode("utf-8"), keep_blank_values=True)
selected_model = fields.get("model", [""])[0].strip()
chat_language = normalize_chat_language(fields.get("chat_language", ["english"])[0])
api_key = fields.get("api_key", [""])[0].strip()
run_mode = fields.get("run_mode", ["new_game"])[0].strip()
replay_session = fields.get("replay_session", [""])[0].strip()
replay_max_decisions_raw = fields.get("replay_max_decisions", [""])[0].strip()
replay_through = fields.get("replay_through", [""])[0].strip()
replay_stop_before = fields.get("replay_stop_before", [""])[0].strip()
replay_skip_chat = "replay_skip_chat" in fields
replay_delay_raw = fields.get("replay_delay", ["2.5"])[0].strip() or "2.5"
replay_text_lead_raw = fields.get("replay_text_lead", ["0.25"])[0].strip() or "0.25"
replay_speak = "replay_speak" in fields
no_llm = "no_llm" in fields
reaction_mode = fields.get("reaction_mode", ["default"])[0].strip()
reaction_batch_size_raw = fields.get("reaction_batch_size", [""])[0].strip()
config_path = fields.get("config_path", [""])[0].strip()
random_seed_raw = fields.get("random_seed", [""])[0].strip()
game_context = fields.get("game_context", [""])[0].strip()
tts_provider = fields.get("tts_provider", ["gemini"])[0].strip()
gemini_tts_model = fields.get("gemini_tts_model", ["gemini-2.5-flash-preview-tts"])[0].strip()
gemini_tts_voice = fields.get("gemini_tts_voice", ["Kore"])[0].strip()
elevenlabs_tts_model = fields.get("elevenlabs_tts_model", ["eleven_v3"])[0].strip()
elevenlabs_api_key = fields.get("elevenlabs_api_key", [""])[0].strip()
elevenlabs_default_voice_id = fields.get("elevenlabs_default_voice_id", [""])[0].strip()
effective_api_key = api_key or (os.environ.get("GEMINI_API_KEY", "") if use_env_keys else "")
effective_elevenlabs_api_key = elevenlabs_api_key or (os.environ.get("ELEVENLABS_API_KEY", "") if use_env_keys else "")
effective_elevenlabs_voice_id = elevenlabs_default_voice_id or (os.environ.get("ELEVENLABS_DEFAULT_VOICE_ID", "") if use_env_keys else "")
player_count_raw = fields.get("player_count", ["3"])[0].strip()
names = [
fields.get(f"player_{index + 1}", [DEFAULT_PLAYER_NAMES[index]])[0].strip()
for index in range(4)
]
errors = []
if selected_model not in valid_models:
errors.append("Choose one of the available Gemini text models.")
if chat_language not in valid_chat_languages:
errors.append("Choose English or Hebrew for table talk.")
if run_mode not in valid_run_modes:
errors.append("Choose a valid run mode.")
needs_session = run_mode in {"resume_session", "watch_replay", "analyse_game"}
if needs_session and not replay_session:
errors.append("Choose a recorded session for replay/resume/analyse mode.")
if replay_through and replay_stop_before:
errors.append("Use either replay-through or replay-stop-before, not both.")
replay_session_path_for_validation = None
if needs_session and replay_session:
try:
replay_session_path_for_validation = resolve_session_path(replay_session)
except FileNotFoundError as exc:
errors.append(str(exc))
if replay_session_path_for_validation and (replay_through or replay_stop_before):
try:
load_replay_decisions(
replay_session_path_for_validation,
replay_through=replay_through or None,
replay_stop_before=replay_stop_before or None
)
except (TypeError, ValueError) as exc:
errors.append(
f"{exc}. Choose one of the suggested action markers; reaction-only table talk is not replayable as a marker."
)
if reaction_mode not in valid_reaction_modes:
errors.append("Choose a valid reaction mode.")
if config_path and not Path(config_path).exists():
errors.append("Config file was not found.")
if len(game_context) > 4000:
errors.append("Additional game context must be 4000 characters or less.")
replay_max_decisions = None
if replay_max_decisions_raw:
try:
replay_max_decisions = int(replay_max_decisions_raw)
if replay_max_decisions < 1:
errors.append("Replay max decisions must be at least 1.")
except ValueError:
errors.append("Replay max decisions must be a number.")
try:
replay_delay = float(replay_delay_raw)
if replay_delay < 0:
errors.append("Replay delay cannot be negative.")
except ValueError:
replay_delay = 2.5
errors.append("Replay delay must be a number.")
try:
replay_text_lead = float(replay_text_lead_raw)
if replay_text_lead < 0:
errors.append("Replay text lead cannot be negative.")
except ValueError:
replay_text_lead = 0.25
errors.append("Replay text lead must be a number.")
reaction_batch_size = None
if reaction_batch_size_raw:
try:
reaction_batch_size = int(reaction_batch_size_raw)
if reaction_batch_size < 1:
errors.append("Reaction batch size must be at least 1.")
except ValueError:
errors.append("Reaction batch size must be a number.")
random_seed = 0
if random_seed_raw:
try:
random_seed = int(random_seed_raw)
except ValueError:
errors.append("Random seed must be a whole number.")
live_mode = run_mode in {"new_game", "resume_session"}
needs_gemini_key = (live_mode and not no_llm) or (tts_provider == "gemini" and (live_mode or replay_speak))
if needs_gemini_key and not effective_api_key:
errors.append("Enter a Gemini API key or run with --use-env-keys after setting GEMINI_API_KEY.")
if tts_provider not in valid_tts_providers:
errors.append("Choose a valid voice provider.")
if tts_provider == "gemini":
if gemini_tts_model not in valid_gemini_tts_models:
errors.append("Choose one of the available Gemini speech models.")
if not gemini_tts_voice:
errors.append("Choose a Gemini voice.")
if tts_provider == "elevenlabs":
if elevenlabs_tts_model not in valid_tts_models:
errors.append("Choose one of the available ElevenLabs speech models.")
if (live_mode or replay_speak) and not effective_elevenlabs_api_key:
errors.append("Enter an ElevenLabs API key or set ELEVENLABS_API_KEY.")
if (live_mode or replay_speak) and not effective_elevenlabs_voice_id:
errors.append("Enter an ElevenLabs default voice ID or set ELEVENLABS_DEFAULT_VOICE_ID.")
try:
player_count = int(player_count_raw)
except ValueError:
player_count = 3
errors.append("Choose 2, 3, or 4 players.")
if player_count not in (2, 3, 4):
errors.append("Choose 2, 3, or 4 players.")
selected_names = names[:player_count]
if run_mode == "new_game":
for index, name in enumerate(selected_names):
if not name:
errors.append(f"Player {index + 1} needs a name.")
lowered_names = [name.lower() for name in selected_names if name]
if len(lowered_names) != len(set(lowered_names)):
errors.append("Player names must be unique.")
if errors:
self._send_html(
render_settings_page(
errors=errors,
selected_model=selected_model if selected_model in valid_models else "gemini-3-flash-preview",
selected_chat_language=chat_language if chat_language in valid_chat_languages else "english",
selected_tts_provider=tts_provider if tts_provider in valid_tts_providers else "gemini",
selected_tts_model=elevenlabs_tts_model if elevenlabs_tts_model in valid_tts_models else "eleven_v3",
selected_gemini_tts_model=gemini_tts_model if gemini_tts_model in valid_gemini_tts_models else "gemini-2.5-flash-preview-tts",
selected_gemini_tts_voice=gemini_tts_voice or "Kore",
player_count=player_count if player_count in (2, 3, 4) else 3,
player_names=names,
selected_run_mode=run_mode if run_mode in valid_run_modes else "new_game",
selected_replay_session=replay_session,
selected_replay_max_decisions=replay_max_decisions_raw,
selected_replay_through=replay_through,
selected_replay_stop_before=replay_stop_before,
selected_replay_skip_chat=replay_skip_chat,
selected_replay_delay=replay_delay_raw,
selected_replay_text_lead=replay_text_lead_raw,
selected_replay_speak=replay_speak,
selected_no_llm=no_llm,
selected_reaction_mode=reaction_mode if reaction_mode in valid_reaction_modes else "default",
selected_reaction_batch_size=reaction_batch_size_raw,
selected_config_path=config_path,
selected_random_seed=random_seed_raw,
selected_game_context=game_context
),
status=400
)
return
settings.update({
"model": selected_model,
"chat_language": chat_language,
"api_key": effective_api_key,
"tts_provider": tts_provider,
"gemini_tts_model": gemini_tts_model,
"gemini_tts_voice": gemini_tts_voice,
"elevenlabs_api_key": effective_elevenlabs_api_key,
"elevenlabs_default_voice_id": effective_elevenlabs_voice_id,
"elevenlabs_tts_model": elevenlabs_tts_model,
"run_mode": run_mode,
"replay_session": replay_session,
"replay_max_decisions": replay_max_decisions,
"replay_through": replay_through or None,
"replay_stop_before": replay_stop_before or None,
"replay_skip_chat": replay_skip_chat,
"replay_delay": replay_delay,
"replay_text_lead": replay_text_lead,
"replay_speak": replay_speak,
"no_llm": no_llm,
"reaction_mode": reaction_mode,
"reaction_batch_size": reaction_batch_size,
"config_path": config_path or None,
"random_seed": random_seed,
"game_context": game_context,
"player_configs": [
{"name": selected_names[index], "is_ai": True, "color": PLAYER_COLORS[index]}
for index in range(player_count)
] if run_mode == "new_game" else [],
})
starting_names = selected_names if run_mode == "new_game" else [replay_session]
self._send_html(_render_game_starting_page(selected_model, starting_names))
settings_ready.set()
server = ReusableThreadingHTTPServer(("127.0.0.1", port), SettingsHandler)
server_thread = threading.Thread(target=server.serve_forever, daemon=True)
server_thread.start()
setup_url = f"http://localhost:{port}/settings"
print(f"[SETUP] Browser settings page: {setup_url}")
try:
webbrowser.open(setup_url)
except Exception as exc:
print(f"[SETUP] Could not open browser automatically: {exc}")
print(f"[SETUP] Open this URL manually: {setup_url}")
print("[SETUP] Waiting for browser settings...")
try:
while not settings_ready.wait(timeout=0.25):
pass
except KeyboardInterrupt:
server.shutdown()
server.server_close()
raise
server.shutdown()
server.server_close()
server_thread.join(timeout=2)
return settings
def print_banner():
"""Print the welcome banner."""
print("=" * 70)
print("[AI] PYCATAN WITH AI AGENTS")
print("=" * 70)
print()
print("All players are AI - you enter their moves manually.")
print()
def setup_game() -> tuple:
"""
Simple setup - ask how many players and their names.
All players are AI agents (manual input mode).
Returns:
Tuple of (num_players, player_configs)
"""
print_banner()
# Default player colors and names
colors = ["Red", "Blue", "White", "Orange"]
default_names = ["Alice", "Bob", "Charlie", "Diana"]
# Get number of players
while True:
try:
num_str = input("How many players? (2-4) [3]: ").strip()
if not num_str:
num_players = 3
else:
num_players = int(num_str)
if 2 <= num_players <= 4:
break
else:
print("Enter 2-4")
except ValueError:
print("Enter a number")
# Get player names
print(f"\nEnter names (or press Enter for default):")
player_configs = []
for i in range(num_players):
name = input(f" Player {i+1} ({colors[i]}) [{default_names[i]}]: ").strip()
if not name:
name = default_names[i]
player_configs.append({
"name": name,
"is_ai": True,
"color": colors[i]
})
# Brief summary
names = [p["name"] for p in player_configs]
print(f"\nPlayers: {', '.join(names)}")
print()
return num_players, player_configs
def create_game(
player_configs: List[dict],
send_to_llm: bool = True,
manual_actions: bool = True,
config: Optional[AIConfig] = None,
replay_decisions: Optional[Dict[str, List[Dict[str, Any]]]] = None,
replay_chat: bool = True,
replay_speak: bool = False,
replay_only: bool = False,
web_port: int = 5000,
random_seed: Optional[int] = 0,
game_config: Optional[Dict[str, Any]] = None
) -> tuple:
"""
Create the game with configured players.
Args:
player_configs: List of player configuration dicts
send_to_llm: If True, sends prompts to LLM (shows suggestions)
manual_actions: If True, user enters actions manually
Returns:
Tuple of (game_manager, ai_manager, web_viz)
"""
# Create AIManager (shared between all AI players)
ai_manager = AIManager(
config=config or AIConfig(),
send_to_llm=send_to_llm,
manual_actions=manual_actions
)
# Create user objects
users = []
replay_decisions = replay_decisions or {}
for i, cfg in enumerate(player_configs):
if cfg["is_ai"]:
if cfg["name"] in replay_decisions:
user = ReplayAIUser(
name=cfg["name"],
user_id=i,
ai_manager=ai_manager,
color=cfg["color"],
replay_decisions=replay_decisions[cfg["name"]],
replay_chat=replay_chat,
replay_speak=replay_speak,
replay_only=replay_only
)
else:
# Create AI user
user = AIUser(
name=cfg["name"],
user_id=i,
ai_manager=ai_manager,
color=cfg["color"]
)
else:
# Create human user
user = HumanUser(cfg["name"], i)
users.append(user)
# Create game manager with optional game config and random seed for reproducibility.
game_manager = GameManager(users, game_config=game_config, random_seed=random_seed)
# Setup web visualization
web_viz = WebVisualization(port=web_port, auto_open=False, debug=False)
viz_manager = VisualizationManager()
viz_manager.add_visualization(web_viz)
game_manager.visualization_manager = viz_manager
# Connect AI chat to web visualization
ai_manager.set_chat_callback(lambda player, msg: web_viz.display_chat(player, msg))
# Connect AI status updates to web visualization
ai_manager.set_status_callback(lambda player, status, details: web_viz.display_ai_status(player, status, details))
print(f"\n[OK] Game created!")
print(f"[LOG] Session: {ai_manager.get_session_path()}")
print(f"[SETUP] Random seed: {random_seed}")
if game_config and "victory_points" in game_config:
print(f"[SETUP] Victory points to win: {game_config['victory_points']}")
print()
return game_manager, ai_manager, web_viz
def run_game(game_manager: GameManager, ai_manager: AIManager, web_viz: WebVisualization):
"""
Run the main game loop.
Args:
game_manager: The GameManager instance
ai_manager: The AIManager instance
web_viz: The WebVisualization instance
"""
# Start web server in background
web_viz.start_server()
# Don't open browser here - batch file already opens unified view
# webbrowser.open("http://localhost:5000")
print("=" * 70)
print("[GAME] GAME STARTING!")
print("[WEB] Board: http://localhost:5000/unified")
print("=" * 70)
print()
print("Commands:")
print(" s - Place settlement (e.g., s 14)")
print(" rd - Place road (e.g., rd 14 15)")
print(" r - Roll dice")
print(" e - End turn")
print(" help - Show all commands")
print()
print("=" * 70)
print()
try:
# Initialize the game
game_manager.start_game()
# Run the main game loop
game_manager.game_loop()
print("\n" + "=" * 70)
print("[WIN] GAME OVER!")
print("=" * 70)
except KeyboardInterrupt:
print("\n\n[!] Game interrupted by user")
except Exception as e:
print(f"\n\n[ERROR] Error: {e}")
import traceback
traceback.print_exc()
finally:
# Save session
print("\n[SAVE] Saving session...")
if getattr(ai_manager.config.agent, "async_reactions", False):
print("[SAVE] Waiting briefly for queued social reactions...")
ai_manager.wait_for_reactions(timeout_seconds=10.0)
ai_manager.save_session()
print(f"[LOG] Session saved to: {ai_manager.get_session_path()}")
if hasattr(ai_manager.tts, "close"):
ai_manager.tts.close()
# Show stats
print("\n[STATS] AI Agent Statistics:")
stats = ai_manager.get_stats()
for name, agent_stats in stats.items():
print(f" {name}: {agent_stats['total_requests']} requests, "
f"{agent_stats['total_tokens_used']} tokens")
def _remaining_replay_decisions(game_manager: GameManager) -> int:
"""Count unplayed replay decisions across replay users."""
total = 0
for user in game_manager.users:
total += len(getattr(user, "replay_decisions", []) or [])
return total
def run_replay_viewer(
game_manager: GameManager,
ai_manager: AIManager,
web_viz: WebVisualization,
delay_seconds: float = 2.5,
source_session: Optional[Path] = None,
text_lead_seconds: float = 0.25
) -> None:
"""
Build a recorded-session timeline and serve it to the browser.
The browser controls playback by seeking captured snapshots, so users can
move backward and forward without re-running game logic.
"""
print("=" * 70)
print("[REPLAY] WATCH MODE")
print("[REPLAY] Building seekable timeline...")
print("=" * 70)
print()
try:
raw_speech_prepare_callback = (
getattr(ai_manager.tts, "prepare_blocking", None)
or getattr(ai_manager.tts, "speak_blocking", None)
or getattr(ai_manager.tts, "speak", None)
)
raw_speech_play_callback = (
getattr(ai_manager.tts, "speak_blocking", None)
or getattr(ai_manager.tts, "speak", None)
)
def speech_prepare_callback(player_name: str, message: str) -> None:
if raw_speech_prepare_callback:
raw_speech_prepare_callback(
ai_manager.get_tts_speaker_key(player_name),
message,
)
def speech_play_callback(player_name: str, message: str) -> None:
if raw_speech_play_callback:
raw_speech_play_callback(
ai_manager.get_tts_speaker_key(player_name),
message,
)
web_viz.enable_replay_mode(
source_session=str(source_session or ai_manager.get_session_path()),
delay_seconds=delay_seconds,
speech_prepare_callback=speech_prepare_callback,
speech_play_callback=speech_play_callback,
text_lead_seconds=text_lead_seconds,
)
game_manager.start_game()
web_viz.capture_replay_snapshot("Start")
consumed_items = set()
while game_manager.is_running and not game_manager._check_game_end_conditions():
remaining_before = _remaining_replay_decisions(game_manager)
if remaining_before <= 0:
print("[REPLAY] All recorded decisions were played.")
break
try:
turn_ended = game_manager._handle_single_turn()
except ReplayExhausted as exc:
print(f"[REPLAY] Stopping: {exc}")
break
remaining_after = _remaining_replay_decisions(game_manager)
if remaining_after == remaining_before:
print("[REPLAY] Stopping because no recorded decision was consumed.")
break
if turn_ended:
game_manager._advance_to_next_player()
consumed = None
for user in game_manager.users:
replay_item = getattr(user, "last_replay_item", None)
if replay_item is not None and id(replay_item) not in consumed_items:
consumed = replay_item
consumed_items.add(id(replay_item))
break
label = "Recorded decision"
if consumed:
parsed = consumed.get("parsed") or {}
label = (
f"{consumed.get('player_name')} #{consumed.get('request_number')}: "
f"{parsed.get('action_type')}"
)
web_viz.capture_replay_snapshot(label, consumed)
print("\n" + "=" * 70)
print(f"[REPLAY] Timeline ready: {len(web_viz.replay_timeline)} snapshots")
print("[WEB] Board: http://localhost:5000/unified")
print(f"[REPLAY] Browser playback delay: {delay_seconds:.1f}s")
print(f"[REPLAY] Text lead before action: {text_lead_seconds:.2f}s")
print("=" * 70)
web_viz.seek_replay(0, speak=False)
web_viz.start_server()
try:
webbrowser.open("http://localhost:5000/unified")
except Exception:
pass
print("[REPLAY] Use the browser controls to play, pause, seek, step backward, or step forward.")
print("[REPLAY] Press Ctrl+C here when you are done watching.")
while True:
time.sleep(1)
except KeyboardInterrupt:
print("\n\n[!] Replay interrupted by user")
except Exception as e:
print(f"\n\n[ERROR] Replay error: {e}")
import traceback
traceback.print_exc()
finally:
print("\n[SAVE] Saving replay viewer session...")
ai_manager.save_session()
if hasattr(ai_manager.tts, "close"):
ai_manager.tts.close()
print(f"[LOG] Replay viewer session saved to: {ai_manager.get_session_path()}")
def main():
"""Main entry point."""
import argparse
parser = argparse.ArgumentParser(description="Play Catan with AI agents")
parser.add_argument("--no-llm", action="store_true",
help="Don't send prompts to LLM (offline mode)")
parser.add_argument("--auto", action="store_true",
help="Let AI play automatically (no manual input)")
parser.add_argument("--players", type=int, choices=[2, 3, 4],
help="Number of players (skip setup)")
parser.add_argument("--all-ai", action="store_true",
help="Make all players AI (skip setup)")
parser.add_argument("--names", type=str, nargs="+",
help="Custom names for AI players (e.g., --names Alice Bob Charlie). Also sets player count.")
parser.add_argument("--config", type=str,
help="Path to AI config YAML. Defaults to pycatan/ai/config_dev.yaml when present.")
parser.add_argument("--browser-settings", action="store_true",
help="Open a browser setup screen for Gemini model/API key and player names before starting.")
parser.add_argument("--use-env-keys", action="store_true",
help="In browser settings, use API keys from environment/.env when form fields are left blank.")
parser.add_argument("--ask-api-keys", "--ask-keys", action="store_true",
help="In browser settings, require API keys to be entered in the browser form.")
parser.add_argument("--chat-language", choices=["english", "hebrew"], default=None,
help="Language for public say_outloud table talk.")
parser.add_argument("--hebrew-chat", action="store_true",
help="Shortcut for --chat-language hebrew.")
parser.add_argument("--english-chat", action="store_true",
help="Shortcut for --chat-language english.")
parser.add_argument("--no-reactions", action="store_true",
help="Disable off-turn social reaction prompts.")
parser.add_argument("--async-reactions", action="store_true",
help="Queue off-turn social reactions in per-player background workers.")
parser.add_argument("--sync-reactions", action="store_true",
help="Force off-turn social reactions to run synchronously.")
parser.add_argument("--reaction-batch-size", type=int, default=None,
help="Maximum queued social reaction events to combine into one observer prompt.")
parser.add_argument("--random-seed", type=int, default=0,
help="Random seed for deterministic dice/deck behavior. Default keeps existing behavior: 0.")
parser.add_argument("--replay-session", type=str,
help="Fast-replay parsed actions from an existing session, then continue live.")
parser.add_argument("--resume-session", type=str,
help="Alias for --replay-session.")
parser.add_argument("--replay-max-decisions", type=int,
help="Maximum number of parsed decisions to replay.")
parser.add_argument("--replay-through", type=str,
help="Replay through a marker like Alice:5, inclusive.")
parser.add_argument("--replay-stop-before", type=str,
help="Stop replay before a marker like Alice:6.")
parser.add_argument("--replay-skip-chat", action="store_true",
help="Do not rebroadcast recorded say_outloud chat while fast-replaying.")
parser.add_argument("--watch-replay", action="store_true",
help="Play a recorded session visually and stop when the recording ends. No LLM calls are made.")
parser.add_argument("--analyse-game", action="store_true",
help="Open a recorded session as a visual replay with per-decision analysis.")
parser.add_argument("--replay-delay", type=float, default=2.5,
help="Seconds to wait between recorded decisions in --watch-replay mode.")
parser.add_argument("--replay-text-lead", type=float, default=0.25,
help="Seconds to show recorded chat before rendering that step's game action.")
parser.add_argument("--replay-speak", action="store_true",
help="Speak recorded say_outloud chat during replay using the configured cached TTS provider.")
args = parser.parse_args()
load_env_file()
ai_config = load_ai_config(args.config)
if args.hebrew_chat:
args.chat_language = "hebrew"
if args.english_chat:
args.chat_language = "english"
ai_config.agent.chat_language = normalize_chat_language(
args.chat_language
or os.environ.get("PYCATAN_CHAT_LANGUAGE")
or ai_config.agent.chat_language
)
if args.no_reactions:
ai_config.agent.enable_reactions = False
if args.async_reactions and args.sync_reactions:
parser.error("--async-reactions and --sync-reactions cannot be used together")
if args.async_reactions:
ai_config.agent.async_reactions = True
if args.sync_reactions:
ai_config.agent.async_reactions = False
if args.reaction_batch_size is not None:
if args.reaction_batch_size < 1:
parser.error("--reaction-batch-size must be at least 1")
ai_config.agent.reaction_max_batch_messages = args.reaction_batch_size
browser_player_configs: Optional[List[dict]] = None
browser_game_context = ""
if args.use_env_keys and args.ask_api_keys:
parser.error("--use-env-keys and --ask-api-keys cannot be used together")
if args.browser_settings:
key_mode = "ask" if args.ask_api_keys else "env"
browser_settings = collect_browser_settings(port=5000, key_mode=key_mode)
if browser_settings.get("config_path"):
ai_config = load_ai_config(browser_settings["config_path"])
args.no_llm = browser_settings["no_llm"]
args.replay_session = browser_settings["replay_session"] or None
args.resume_session = None
args.replay_max_decisions = browser_settings["replay_max_decisions"]
args.replay_through = browser_settings["replay_through"]
args.replay_stop_before = browser_settings["replay_stop_before"]
args.replay_skip_chat = browser_settings["replay_skip_chat"]
args.watch_replay = browser_settings["run_mode"] in {"watch_replay", "analyse_game"}
args.analyse_game = browser_settings["run_mode"] == "analyse_game"
args.replay_delay = browser_settings["replay_delay"]
args.replay_text_lead = browser_settings["replay_text_lead"]
args.replay_speak = browser_settings["replay_speak"]
reaction_mode = browser_settings["reaction_mode"]
if reaction_mode == "off":
ai_config.agent.enable_reactions = False
elif reaction_mode == "async":
ai_config.agent.enable_reactions = True
ai_config.agent.async_reactions = True
elif reaction_mode == "sync":
ai_config.agent.enable_reactions = True
ai_config.agent.async_reactions = False
if browser_settings["reaction_batch_size"] is not None:
ai_config.agent.reaction_max_batch_messages = browser_settings["reaction_batch_size"]
ai_config.agent.chat_language = browser_settings["chat_language"]
if browser_settings["api_key"]:
os.environ["GEMINI_API_KEY"] = browser_settings["api_key"]
os.environ["TTS_PROVIDER"] = browser_settings["tts_provider"]
if browser_settings["tts_provider"] == "gemini":
os.environ["GEMINI_TTS_ENABLED"] = "true"
os.environ["GEMINI_TTS_MODEL_ID"] = browser_settings["gemini_tts_model"]
os.environ["GEMINI_TTS_VOICE_NAME"] = browser_settings["gemini_tts_voice"]
os.environ.setdefault("GEMINI_TTS_PLAY_AUDIO", "true")
elif browser_settings["tts_provider"] == "elevenlabs":
os.environ["ELEVENLABS_TTS_ENABLED"] = "true"
os.environ["ELEVENLABS_API_KEY"] = browser_settings["elevenlabs_api_key"]
os.environ["ELEVENLABS_DEFAULT_VOICE_ID"] = browser_settings["elevenlabs_default_voice_id"]
os.environ["ELEVENLABS_TTS_MODEL_ID"] = browser_settings["elevenlabs_tts_model"]
os.environ.setdefault("ELEVENLABS_TTS_OUTPUT_FORMAT", "pcm_16000")
os.environ.setdefault("ELEVENLABS_TTS_PLAY_AUDIO", "true")
ai_config.llm.provider = "gemini"
ai_config.llm.api_key_env_var = "GEMINI_API_KEY"
ai_config.llm.model_name = browser_settings["model"]
browser_player_configs = browser_settings["player_configs"]
args.random_seed = browser_settings["random_seed"]
browser_game_context = browser_settings.get("game_context", "")
args.all_ai = True
print("[SETUP] Browser settings accepted")
replay_session_ref = args.replay_session or args.resume_session
if args.analyse_game:
args.watch_replay = True
if args.watch_replay and not replay_session_ref:
parser.error("--watch-replay/--analyse-game requires --replay-session or --resume-session")
replay_session_path = resolve_session_path(replay_session_ref) if replay_session_ref else None
if (
args.watch_replay
and replay_session_path
and not os.environ.get("AI_TTS_CACHE_DIR")
and not os.environ.get("PYCATAN_TTS_CACHE_DIR")
):
os.environ["AI_TTS_CACHE_DIR"] = str(replay_session_path / "tts_cache")
os.environ["AI_TTS_CACHE_DIR_AUTO"] = "replay_session_default"
print(f"[REPLAY] TTS cache: {os.environ['AI_TTS_CACHE_DIR']}")
elif not args.watch_replay and not os.environ.get("AI_TTS_CACHE_DIR") and not os.environ.get("PYCATAN_TTS_CACHE_DIR"):
print("[TTS] Voice cache: per-session tts_cache/")
replay_decision_list: List[Dict[str, Any]] = []
replay_decisions_by_player: Dict[str, List[Dict[str, Any]]] = {}
replay_player_names: List[str] = []
if replay_session_path:
replay_decision_list = load_replay_decision_chain(
replay_session_path,
max_decisions=args.replay_max_decisions,
replay_through=args.replay_through,
replay_stop_before=args.replay_stop_before
)
replay_decisions_by_player = group_replay_decisions(replay_decision_list)
replay_player_names = infer_players_from_session(replay_session_path)
if not replay_player_names:
replay_player_names = infer_players_from_decisions(replay_decision_list)
print(f"[REPLAY] Source: {replay_session_path}")
print(f"[REPLAY] Loaded {len(replay_decision_list)} parsed decisions")
if (replay_session_path / "session_metadata.json").exists():
print("[REPLAY] Derived-session lineage is included when present")
# Quick setup mode - either explicit --players or inferred from --names
num_players = args.players
# If names provided, infer player count from names (unless explicitly set)
if args.names:
if not num_players:
num_players = min(len(args.names), 4) # Max 4 players
if num_players < 2:
num_players = 2 # Min 2 players
args.all_ai = True # Names implies all-ai mode
elif replay_session_path and replay_player_names:
num_players = min(len(replay_player_names), 4)
args.names = replay_player_names[:num_players]
args.all_ai = True
if browser_player_configs:
player_configs = browser_player_configs
num_players = len(player_configs)
print_banner()
print(
f"Browser setup: {num_players} AI players - "
f"{', '.join(player['name'] for player in player_configs)}"
)
elif num_players and args.all_ai:
colors = ["Red", "Blue", "White", "Orange"]
default_names = ["Alice", "Bob", "Charlie", "Diana"]
# Use custom names if provided, otherwise use defaults
if args.names:
names = args.names[:num_players]
# Pad with defaults if not enough names provided
while len(names) < num_players:
names.append(default_names[len(names)])
else:
names = default_names[:num_players]
player_configs = [
{"name": names[i], "is_ai": True, "color": colors[i]}
for i in range(num_players)
]
print_banner()
print(f"Quick setup: {num_players} AI players - {', '.join(names)}")
else:
# Interactive setup
num_players, player_configs = setup_game()
# Determine mode
send_to_llm = not args.no_llm # Default: send to LLM
manual_actions = not args.auto # Default: manual input
if args.watch_replay:
send_to_llm = False
manual_actions = False
if args.analyse_game:
print("[ANALYSE] Analysis replay enabled: using recorded decisions only")
else:
print("[REPLAY] Watch mode enabled: using recorded decisions only")
print(f"[MODE] LLM: {'ON' if send_to_llm else 'OFF'} | Actions: {'Manual' if manual_actions else 'Auto'}")
print(f"[CONFIG] {ai_config.llm.provider}/{ai_config.llm.model_name}")
if browser_game_context:
print("[CONFIG] Additional game context enabled")
# Create game
game_manager, ai_manager, web_viz = create_game(
player_configs,
send_to_llm=send_to_llm,
manual_actions=manual_actions,
config=ai_config,
replay_decisions=replay_decisions_by_player,
replay_chat=not args.replay_skip_chat,
replay_speak=(args.replay_speak and not args.watch_replay),
replay_only=args.watch_replay,
random_seed=args.random_seed,
game_config={"game_context": browser_game_context} if browser_game_context else None
)
if replay_session_path:
annotate_replay_session(
ai_manager,
replay_session_path,
replay_decision_list,
args.replay_through,
args.replay_stop_before,
mode=(
"analyse_game_visual_playback"
if args.analyse_game
else "watch_replay_visual_playback"
if args.watch_replay
else "fast_action_replay_then_live_ai"
)
)
print(f"[REPLAY] New derived session: {ai_manager.get_session_path()}")
# Run game
if args.watch_replay:
run_replay_viewer(
game_manager,
ai_manager,
web_viz,
delay_seconds=max(0.0, args.replay_delay),
source_session=replay_session_path,
text_lead_seconds=max(0.0, args.replay_text_lead)
)
else:
run_game(game_manager, ai_manager, web_viz)
if __name__ == "__main__":
main()