Spaces:

DuckHuggingFace
/

text-adventure-agent

No application file

App Files Files Community

DuckHuggingFace commited on Feb 16

Commit

38c0f49

1 Parent(s): 75629a4

cleanup for submissions

Browse files

Files changed (9) hide show

.gitignore +5 -0
example_submission/agent.py +0 -404
games/__pycache__/__init__.cpython-313.pyc +0 -0
games/__pycache__/zork_env.cpython-313.pyc +0 -0
mcp_server.py +0 -196
{example_submission → submission}/README.md +0 -0
agent.py → submission/agent.py +0 -0
app.py → submission/app.py +0 -0
{example_submission → submission}/mcp_server.py +0 -0

.gitignore ADDED Viewed

	@@ -0,0 +1,5 @@

+submission_template/**
+**/__pycache__/**
+.venv/**
+.env
+z-machines-games-master/**

example_submission/agent.py DELETED Viewed

@@ -1,404 +0,0 @@
-"""
-Example: MCP ReAct Agent
-A complete ReAct agent that uses MCP tools to play text adventure games.
-This is a working example students can learn from.
-"""
-import json
-import os
-import re
-from dataclasses import dataclass, field
-from typing import Optional
-from dotenv import load_dotenv
-from huggingface_hub import InferenceClient
-load_dotenv()
-# =============================================================================
-# LLM Configuration - DO NOT MODIFY
-# =============================================================================
-LLM_MODEL = "Qwen/Qwen2.5-72B-Instruct"
-_hf_token = os.getenv("HF_TOKEN")
-if not _hf_token:
-    raise ValueError("HF_TOKEN not found. Set it in your .env file.")
-LLM_CLIENT = InferenceClient(token=_hf_token)
-def call_llm(prompt: str, system_prompt: str, seed: int, max_tokens: int = 300) -> str:
-    """Call the LLM with the given prompt."""
-    messages = [
-        {"role": "system", "content": system_prompt},
-        {"role": "user", "content": prompt},
-    ]
-    response = LLM_CLIENT.chat.completions.create(
-        model=LLM_MODEL,
-        messages=messages,
-        temperature=0.0,
-        max_tokens=max_tokens,
-        seed=seed,
-    )
-    return response.choices[0].message.content
-@dataclass
-class RunResult:
-    """Result of running the agent. Do not modify this class."""
-    final_score: int
-    max_score: int
-    moves: int
-    locations_visited: set[str]
-    game_completed: bool
-    error: Optional[str] = None
-    history: list[tuple[str, str, str]] = field(default_factory=list)
-# =============================================================================
-# System Prompt
-# =============================================================================
-SYSTEM_PROMPT = """You are an expert text adventure game player. Your goal is to explore, collect treasures, and maximize your score.
-AVAILABLE TOOLS (use these via MCP):
-1. play_action - Execute game commands (north, take lamp, open mailbox, etc.)
-2. memory - Get current game state, score, and recent history
-3. get_map - See explored locations and connections
-4. inventory - Check what you're carrying
-VALID GAME COMMANDS for play_action:
-- Movement: north, south, east, west, up, down, enter, exit
-- Objects: take <item>, drop <item>, open <thing>, close <thing>, examine <thing>
-- Light: turn on lamp, turn off lamp
-- Combat: attack <enemy> with <weapon>
-- Other: inventory, look, read <thing>, wait
-FORBIDDEN (will NOT work): check, inspect, search, grab, use, help
-RESPOND IN THIS EXACT FORMAT (no markdown):
-THOUGHT: <brief reasoning about what to do next>
-TOOL: <tool_name>
-ARGS: <JSON arguments>
-Examples:
-THOUGHT: I need to see what's around me.
-TOOL: play_action
-ARGS: {"action": "look"}
-THOUGHT: Let me check my current state and score.
-TOOL: memory
-ARGS: {}
-THOUGHT: The mailbox might contain something useful.
-TOOL: play_action
-ARGS: {"action": "open mailbox"}
-STRATEGY:
-1. Start by looking around and checking memory
-2. Explore systematically - try all directions
-3. Pick up useful items (lamp, sword, etc.)
-4. Open containers (mailbox, window, etc.)
-5. Use get_map to avoid getting lost
-6. Turn on lamp before dark areas!
-DO NOT repeat the same action multiple times in a row."""
-# =============================================================================
-# Student Agent Implementation
-# =============================================================================
-class StudentAgent:
-    """
-    MCP ReAct Agent - A complete working example.
-    This agent demonstrates:
-    - ReAct loop (Thought -> Tool -> Observation)
-    - Loop detection
-    - Action validation
-    - Score tracking via memory tool
-    """
-    def __init__(self):
-        """Initialize the agent state."""
-        self.history: list[dict] = []
-        self.recent_actions: list[str] = []
-        self.score: int = 0
-    async def run(
-        self,
-        client,
-        game: str,
-        max_steps: int,
-        seed: int,
-        verbose: bool = False,
-    ) -> RunResult:
-        """Run the agent for a game session."""
-        locations_visited = set()
-        history = []
-        moves = 0
-        # Get list of available tools
-        tools = await client.list_tools()
-        tool_names = [t.name for t in tools]
-        # Get initial observation
-        result = await client.call_tool("play_action", {"action": "look"})
-        observation = self._extract_result(result)
-        # Track initial location
-        location = observation.split("\n")[0] if observation else "Unknown"
-        locations_visited.add(location)
-        if verbose:
-            print(f"\n{observation}")
-        # Main ReAct loop
-        for step in range(1, max_steps + 1):
-            # Build prompt with context
-            prompt = self._build_prompt(observation)
-            # Call LLM for reasoning (use step-based seed for variety)
-            response = call_llm(prompt, SYSTEM_PROMPT, seed + step)
-            # Parse the response
-            thought, tool_name, tool_args = self._parse_response(response, tool_names)
-            if verbose:
-                print(f"\n--- Step {step} ---")
-                print(f"[THOUGHT] {thought}")
-                print(f"[TOOL] {tool_name}({tool_args})")
-            # Validate and fix common issues
-            tool_name, tool_args = self._validate_tool_call(tool_name, tool_args, tool_names)
-            # Loop detection
-            if tool_name == "play_action":
-                action = tool_args.get("action", "look")
-                self.recent_actions.append(action)
-                if len(self.recent_actions) > 5:
-                    self.recent_actions = self.recent_actions[-5:]
-                # Detect loops - if same action 3 times, force "look"
-                if len(self.recent_actions) >= 3 and len(set(self.recent_actions[-3:])) == 1:
-                    if verbose:
-                        print(f"[WARNING] Loop detected - forcing 'look'")
-                    tool_args = {"action": "look"}
-                    self.recent_actions.append("look")
-                moves += 1
-            # Execute the tool
-            try:
-                result = await client.call_tool(tool_name, tool_args)
-                observation = self._extract_result(result)
-                if verbose:
-                    print(f"[RESULT] {observation[:200]}...")
-            except Exception as e:
-                observation = f"Error: {e}"
-                if verbose:
-                    print(f"[ERROR] {e}")
-            # Track location
-            location = observation.split("\n")[0] if observation else "Unknown"
-            locations_visited.add(location)
-            # Update history
-            self.history.append({
-                "step": step,
-                "thought": thought,
-                "tool": tool_name,
-                "args": tool_args,
-                "result": observation[:200]
-            })
-            if len(self.history) > 10:
-                self.history = self.history[-10:]
-            # Track score from observation
-            self._update_score(observation)
-            # Record in result history
-            history.append((thought, f"{tool_name}({tool_args})", observation[:100]))
-            # Check for game over
-            if self._is_game_over(observation):
-                if verbose:
-                    print("\n*** GAME OVER ***")
-                break
-        return RunResult(
-            final_score=self.score,
-            max_score=350,
-            moves=moves,
-            locations_visited=locations_visited,
-            game_completed=self._is_game_over(observation),
-            history=history,
-        )
-    def _build_prompt(self, observation: str) -> str:
-        """Build the prompt for the LLM with context."""
-        parts = []
-        parts.append(f"Current Score: {self.score}")
-        # Recent history
-        if self.history:
-            parts.append("\nRecent actions:")
-            for entry in self.history[-3:]:
-                action = entry.get("args", {}).get("action", entry["tool"])
-                result_short = entry["result"][:80] + "..." if len(entry["result"]) > 80 else entry["result"]
-                parts.append(f"  > {action} -> {result_short}")
-            # Warn about repeated actions
-            if self.recent_actions and len(set(self.recent_actions[-3:])) == 1:
-                parts.append(f"\n[WARNING: You've been doing '{self.recent_actions[-1]}' repeatedly. TRY SOMETHING DIFFERENT!]")
-        parts.append(f"\nCurrent situation:\n{observation}")
-        parts.append("\nWhat do you do next?")
-        return "\n".join(parts)
-    def _parse_response(self, response: str, valid_tools: list[str]) -> tuple[str, str, dict]:
-        """Parse the LLM response to extract thought, tool, and arguments."""
-        thought = "No reasoning provided"
-        tool_name = "play_action"
-        tool_args = {"action": "look"}
-        lines = response.strip().split("\n")
-        for line in lines:
-            line_clean = line.strip()
-            line_upper = line_clean.upper()
-            if line_upper.startswith("THOUGHT:"):
-                thought = line_clean.split(":", 1)[1].strip()
-            elif line_upper.startswith("TOOL:"):
-                raw_tool = line_clean.split(":", 1)[1].strip().lower()
-                raw_tool = raw_tool.replace("**", "").replace("*", "").replace("`", "")
-                raw_tool = raw_tool.split()[0] if raw_tool else "play_action"
-                tool_name = raw_tool
-            elif line_upper.startswith("ARGS:"):
-                args_part = line_clean.split(":", 1)[1].strip()
-                try:
-                    args_part = args_part.replace("'", '"')
-                    tool_args = json.loads(args_part)
-                except json.JSONDecodeError:
-                    match = re.search(r'"action"\s*:\s*"([^"]+)"', args_part)
-                    if match:
-                        tool_args = {"action": match.group(1)}
-                    else:
-                        tool_args = {"action": "look"}
-        return thought, tool_name, tool_args
-    def _validate_tool_call(self, tool_name: str, tool_args: dict, valid_tools: list[str]) -> tuple[str, dict]:
-        """Validate and fix common tool call issues."""
-        # Fix tool name
-        if tool_name not in valid_tools:
-            if tool_name in ["action", "do", "command"]:
-                tool_name = "play_action"
-            elif tool_name in ["map", "location"]:
-                tool_name = "get_map"
-            elif tool_name in ["mem", "state", "status"]:
-                tool_name = "memory"
-            elif tool_name in ["inv", "items"]:
-                tool_name = "inventory"
-            else:
-                tool_name = "play_action"
-        # Fix action verbs
-        if tool_name == "play_action":
-            action = tool_args.get("action", "look")
-            invalid_verb_map = {
-                "check": "examine",
-                "inspect": "examine",
-                "search": "look",
-                "grab": "take",
-                "pick": "take",
-                "use": "examine",
-                "investigate": "examine",
-            }
-            words = action.lower().split()
-            if words and words[0] in invalid_verb_map:
-                words[0] = invalid_verb_map[words[0]]
-                action = " ".join(words)
-            action = action.lower().strip()
-            action = action.replace("**", "").replace("*", "").replace("`", "")
-            action = " ".join(action.split())
-            tool_args["action"] = action
-        return tool_name, tool_args
-    def _extract_result(self, result) -> str:
-        """Extract text from MCP tool result."""
-        if hasattr(result, 'content') and result.content:
-            return result.content[0].text
-        if isinstance(result, list) and result:
-            return result[0].text if hasattr(result[0], 'text') else str(result[0])
-        return str(result)
-    def _update_score(self, text: str) -> None:
-        """Update score from game text."""
-        patterns = [
-            r'Score:\s*(\d+)',
-            r'score[:\s]+(\d+)',
-            r'\[Score:\s*(\d+)',
-        ]
-        for pattern in patterns:
-            match = re.search(pattern, text, re.IGNORECASE)
-            if match:
-                self.score = max(self.score, int(match.group(1)))
-    def _is_game_over(self, text: str) -> bool:
-        """Check if the game is over."""
-        game_over_phrases = [
-            "game over",
-            "you have died",
-            "you are dead",
-            "*** you have died ***",
-        ]
-        text_lower = text.lower()
-        return any(phrase in text_lower for phrase in game_over_phrases)
-# =============================================================================
-# Local Testing
-# =============================================================================
-async def test_agent():
-    """Test the agent locally."""
-    from fastmcp import Client
-    agent = StudentAgent()
-    async with Client("mcp_server.py") as client:
-        result = await agent.run(
-            client=client,
-            game="zork1",
-            max_steps=20,
-            seed=42,
-            verbose=True,
-        )
-        print(f"\n{'=' * 50}")
-        print(f"Final Score: {result.final_score}")
-        print(f"Moves: {result.moves}")
-        print(f"Locations: {len(result.locations_visited)}")
-if __name__ == "__main__":
-    import asyncio
-    asyncio.run(test_agent())

games/__pycache__/__init__.cpython-313.pyc DELETED Viewed

Binary file (374 Bytes)

games/__pycache__/zork_env.cpython-313.pyc DELETED Viewed

Binary file (9.63 kB)

mcp_server.py DELETED Viewed

@@ -1,196 +0,0 @@
-"""
-Example: MCP Server for Text Adventures
-A complete MCP server that exposes text adventure games via tools.
-This demonstrates a full-featured server with memory, mapping, and inventory.
-"""
-import sys
-import os
-# Add parent directory to path to import games module
-sys.path.insert(0, os.path.dirname(os.path.dirname(os.path.abspath(__file__))))
-from fastmcp import FastMCP
-from games.zork_env import TextAdventureEnv, list_available_games
-# Get game from environment variable (default: zork1)
-INITIAL_GAME = os.environ.get("GAME", "zork1")
-# Create the MCP server
-mcp = FastMCP("Text Adventure Server")
-class GameState:
-    """Manages the text adventure game state and exploration data."""
-    def __init__(self, game: str = "zork1"):
-        self.game_name = game
-        self.env = TextAdventureEnv(game)
-        self.state = self.env.reset()
-        self.history: list[tuple[str, str]] = []
-        self.explored_locations: dict[str, set[str]] = {}
-        self.current_location: str = self._extract_location(self.state.observation)
-    def _extract_location(self, observation: str) -> str:
-        """Extract location name from observation (usually first line)."""
-        lines = observation.strip().split('\n')
-        return lines[0] if lines else "Unknown"
-    def take_action(self, action: str) -> str:
-        """Execute a game action and return the result."""
-        self.state = self.env.step(action)
-        result = self.state.observation
-        # Track history
-        self.history.append((action, result))
-        if len(self.history) > 50:
-            self.history = self.history[-50:]
-        # Update map
-        new_location = self._extract_location(result)
-        if action in ["north", "south", "east", "west", "up", "down",
-                      "enter", "exit", "n", "s", "e", "w", "u", "d"]:
-            if self.current_location not in self.explored_locations:
-                self.explored_locations[self.current_location] = set()
-            if new_location != self.current_location:
-                self.explored_locations[self.current_location].add(f"{action} -> {new_location}")
-        self.current_location = new_location
-        return result
-    def get_memory(self) -> str:
-        """Get a summary of current game state."""
-        recent = self.history[-5:] if self.history else []
-        recent_str = "\n".join([f"  > {a} -> {r[:60]}..." for a, r in recent]) if recent else "  (none yet)"
-        return f"""Current State:
-- Location: {self.current_location}
-- Score: {self.state.score} points
-- Moves: {self.state.moves}
-- Game: {self.game_name}
-Recent Actions:
-{recent_str}
-Current Observation:
-{self.state.observation}"""
-    def get_map(self) -> str:
-        """Get a map of explored locations."""
-        if not self.explored_locations:
-            return "Map: No locations explored yet. Try moving around!"
-        lines = ["Explored Locations and Exits:"]
-        for loc, exits in sorted(self.explored_locations.items()):
-            lines.append(f"\n* {loc}")
-            for exit_info in sorted(exits):
-                lines.append(f"    -> {exit_info}")
-        lines.append(f"\n[Current] {self.current_location}")
-        return "\n".join(lines)
-    def get_inventory(self) -> str:
-        """Get current inventory."""
-        items = self.state.inventory if hasattr(self.state, 'inventory') and self.state.inventory else []
-        if not items:
-            return "Inventory: You are empty-handed."
-        item_names = []
-        for item in items:
-            item_str = str(item)
-            item_lower = item_str.lower()
-            if "parent" in item_lower:
-                idx = item_lower.index("parent")
-                name = item_str[:idx].strip()
-                if ":" in name:
-                    name = name.split(":", 1)[1].strip()
-                item_names.append(name)
-            elif ":" in item_str:
-                name = item_str.split(":")[1].strip()
-                item_names.append(name)
-            else:
-                item_names.append(item_str)
-        return f"Inventory: {', '.join(item_names)}"
-# Global game state
-_game_state: GameState | None = None
-def get_game() -> GameState:
-    """Get or initialize the game state."""
-    global _game_state
-    if _game_state is None:
-        _game_state = GameState(INITIAL_GAME)
-    return _game_state
-# =============================================================================
-# MCP Tools
-# =============================================================================
-@mcp.tool()
-def play_action(action: str) -> str:
-    """
-    Execute a game action in the text adventure.
-    Args:
-        action: The command to execute (e.g., 'north', 'take lamp', 'open mailbox')
-    Returns:
-        The game's response to your action
-    """
-    game = get_game()
-    result = game.take_action(action)
-    # Add score info
-    score_info = f"\n\n[Score: {game.state.score} | Moves: {game.state.moves}]"
-    if game.state.reward > 0:
-        score_info = f"\n\n+{game.state.reward} points! (Total: {game.state.score})"
-    done_info = ""
-    if game.state.done:
-        done_info = "\n\nGAME OVER"
-    return result + score_info + done_info
-@mcp.tool()
-def memory() -> str:
-    """
-    Get a summary of the current game state.
-    Returns location, score, moves, recent actions, and current observation.
-    """
-    return get_game().get_memory()
-@mcp.tool()
-def get_map() -> str:
-    """
-    Get a map showing explored locations and connections.
-    Useful for navigation and avoiding getting lost.
-    """
-    return get_game().get_map()
-@mcp.tool()
-def inventory() -> str:
-    """
-    Check what items you are currently carrying.
-    """
-    return get_game().get_inventory()
-# =============================================================================
-# Main
-# =============================================================================
-if __name__ == "__main__":
-    mcp.run()

{example_submission → submission}/README.md RENAMED Viewed

File without changes

agent.py → submission/agent.py RENAMED Viewed

File without changes

app.py → submission/app.py RENAMED Viewed

File without changes

{example_submission → submission}/mcp_server.py RENAMED Viewed

File without changes