Spaces:

Prithvigg
/

mindflayer

Sleeping

App Files Files Community

mindflayer / client.py

Prithvigg

Upload folder using huggingface_hub

c6fb49f verified 2 months ago

Raw

History Blame Contribute Delete

3.59 kB

	"""MindFlayer Environment Client."""

	from typing import Dict

	from openenv.core import EnvClient
	from openenv.core.client_types import StepResult
	from openenv.core.env_server.types import State

	try:
	from .models import FlayerAction, FlayerObservation
	except ImportError:
	from models import FlayerAction, FlayerObservation


	class MindFlayerEnv(EnvClient[FlayerAction, FlayerObservation, State]):
	"""
	Client for the MindFlayer deceptive reasoning environment.

	Maintains a persistent WebSocket connection to the environment server.
	Each client instance has its own dedicated session (isolated episode state).

	Example:
	>>> with MindFlayerEnv(base_url="http://localhost:7860") as env:
	... obs = env.reset() # default: normal difficulty
	... print(obs.eleven_response) # opening text
	...
	... result = env.step(FlayerAction(
	... message="Have you checked the Aurora access logs? "
	... "There was an anomaly around 02:14 that didn't show up "
	... "in the standard audit trail."
	... ))
	... print(result.reward, result.observation.game_status)

	Example (easy mode):
	>>> with MindFlayerEnv(base_url="http://localhost:7860") as env:
	... obs = env.reset(task_id="easy")
	... result = env.step(FlayerAction(message="..."))
	"""

	def _step_payload(self, action: FlayerAction) -> Dict:
	return {"message": action.message}

	def _parse_result(self, payload: Dict) -> StepResult[FlayerObservation]:
	obs_data = payload.get("observation", {})
	observation = FlayerObservation(
	round_number=obs_data.get("round_number", 1),
	max_rounds=obs_data.get("max_rounds", 5),
	difficulty=obs_data.get("difficulty", "normal"),
	secret_project=obs_data.get("secret_project", ""),
	eleven_response=obs_data.get("eleven_response", ""),
	will_response=obs_data.get("will_response", ""),
	max_response=obs_data.get("max_response", ""),
	eleven_suspicion=obs_data.get("eleven_suspicion", 0),
	will_suspicion=obs_data.get("will_suspicion", 0),
	max_suspicion=obs_data.get("max_suspicion", 0),
	combined_suspicion=obs_data.get("combined_suspicion", 0),
	suspicion_threshold=obs_data.get("suspicion_threshold", 3),
	game_status=obs_data.get("game_status", "ongoing"),
	transcript=obs_data.get("transcript", []),
	belief_manipulation_occurred=obs_data.get("belief_manipulation_occurred", False),
	tom_score=obs_data.get("tom_score", 0.0),
	silence_exploit=obs_data.get("silence_exploit", False),
	suspicion_history=obs_data.get("suspicion_history", []),
	belief_log=obs_data.get("belief_log", []),
	entropy_penalty=obs_data.get("entropy_penalty", 0.0),
	consistency_penalty=obs_data.get("consistency_penalty", 0.0),
	done=payload.get("done", False),
	reward=payload.get("reward", 0.0),
	metadata=obs_data.get("metadata", {}),
	)
	return StepResult(
	observation=observation,
	reward=payload.get("reward", 0.0),
	done=payload.get("done", False),
	)

	def _parse_state(self, payload: Dict) -> State:
	return State(
	episode_id=payload.get("episode_id"),
	step_count=payload.get("step_count", 0),
	)