# cyberselfplay-env / client.py
# HarshitShri026 · cyberenv · 562e74f
# Copyright (c) Meta Platforms, Inc. and affiliates.
# All rights reserved.
#
# This source code is licensed under the BSD-style license found in the
# LICENSE file in the root directory of this source tree.
"""CyberSelfPlay Environment Client."""
from typing import Dict
from openenv.core import EnvClient
from openenv.core.client_types import StepResult
from openenv.core.env_server.types import State
from cyber_selfplay_env.models import CyberAction, CyberObservation
class CyberSelfPlayEnv(EnvClient[CyberAction, CyberObservation, State]):
    """
    Client for the CyberSelfPlay environment.

    This client maintains a persistent WebSocket connection to the environment
    server, enabling efficient multi-step interactions with lower latency.
    Each client instance has its own dedicated environment session on the
    server.

    The three hooks defined here translate between the typed models
    (``CyberAction``, ``CyberObservation``, ``State``) and the plain
    dictionaries exchanged with the server.
    """

    def _step_payload(self, action: CyberAction) -> Dict:
        """
        Convert CyberAction to JSON payload for step message.

        Args:
            action: CyberAction instance

        Returns:
            Dictionary representation suitable for JSON encoding, holding the
            ``actor``, ``tool_name``, ``target``, ``params`` and ``rationale``
            attributes of the action under keys of the same name.
        """
        return {
            "actor": action.actor,
            "tool_name": action.tool_name,
            "target": action.target,
            "params": action.params,
            "rationale": action.rationale,
        }

    def _parse_result(self, payload: Dict) -> StepResult[CyberObservation]:
        """
        Parse server response into StepResult[CyberObservation].

        Observation fields are read from the nested ``"observation"`` mapping
        and fall back to empty defaults when absent. ``done`` and ``reward``
        are read from the top level of ``payload``.

        Args:
            payload: JSON response data from server

        Returns:
            StepResult with CyberObservation
        """
        # ``payload.get("observation", {})`` would hand back None when the key
        # is present but null, and the field lookups below would then raise
        # AttributeError. Fall back to an empty mapping for any falsy value.
        obs_data = payload.get("observation") or {}
        done = payload.get("done", False)

        observation = CyberObservation(
            actor=obs_data.get("actor", ""),
            public_state=obs_data.get("public_state", {}),
            telemetry=obs_data.get("telemetry", []),
            incident_summary=obs_data.get("incident_summary", {}),
            done=done,
            # On the observation a missing reward defaults to 0.0 ...
            reward=payload.get("reward", 0.0),
            metadata=obs_data.get("metadata", {}),
        )
        return StepResult(
            observation=observation,
            # ... while the step result keeps None when no reward is reported.
            reward=payload.get("reward"),
            done=done,
        )

    def _parse_state(self, payload: Dict) -> State:
        """
        Parse server response into State object.

        Args:
            payload: JSON response from state request

        Returns:
            State object with episode_id and step_count; ``episode_id`` is
            None and ``step_count`` is 0 when the respective key is missing.
        """
        return State(
            episode_id=payload.get("episode_id"),
            step_count=payload.get("step_count", 0),
        )