# myenv/server/myenv_environment.py
# zkwentz's picture
# Upload folder using huggingface_hub
# 7b3bda1 verified
# Copyright (c) Meta Platforms, Inc. and affiliates.
# All rights reserved.
#
# This source code is licensed under the BSD-style license found in the
# LICENSE file in the root directory of this source tree.
"""
Myenv Environment Implementation.
A simple test environment that echoes back messages sent to it.
Perfect for testing HTTP server infrastructure.
"""
from uuid import uuid4
from openenv_core.env_server.interfaces import Environment
from openenv_core.env_server.types import State
from myenv.models import MyenvAction, MyenvObservation
class MyenvEnvironment(Environment):
    """
    A simple echo environment that echoes back messages.

    This environment is designed for testing the HTTP server infrastructure.
    It maintains minimal state (an episode id, a step counter and a reset
    counter) and simply echoes back whatever message it receives.

    Example:
        >>> env = MyenvEnvironment()
        >>> obs = env.reset()
        >>> print(obs.echoed_message)  # "Myenv environment ready!"
        >>>
        >>> obs = env.step(MyenvAction(message="Hello"))
        >>> print(obs.echoed_message)  # "Hello"
        >>> print(obs.message_length)  # 5
    """

    def __init__(self):
        """Initialize the myenv environment with a fresh episode state."""
        # Run the base-class initializer so that any attributes it defines
        # exist on this instance before the environment is used.
        # NOTE(review): assumes Environment.__init__ takes no required
        # arguments -- confirm against openenv_core.
        super().__init__()
        self._state = State(episode_id=str(uuid4()), step_count=0)
        # Number of times reset() has been called on this instance.
        self._reset_count = 0

    def reset(self) -> MyenvObservation:
        """
        Reset the environment.

        Replaces the current state with a new one (new random episode id,
        step count back to zero) and increments the internal reset counter.

        Returns:
            MyenvObservation with a ready message, zero length, zero reward
            and ``done=False``.
        """
        self._state = State(episode_id=str(uuid4()), step_count=0)
        self._reset_count += 1
        return MyenvObservation(
            echoed_message="Myenv environment ready!",
            message_length=0,
            done=False,
            reward=0.0,
        )

    def step(self, action: MyenvAction) -> MyenvObservation:  # type: ignore[override]
        """
        Execute a step in the environment by echoing the message.

        Increments the step counter on the current state, then builds an
        observation from ``action.message``.

        Args:
            action: MyenvAction containing the message to echo.

        Returns:
            MyenvObservation with the echoed message, its length, a reward
            proportional to that length, and metadata holding the original
            message and the step number. ``done`` is always False.
        """
        self._state.step_count += 1
        message = action.message
        length = len(message)
        # Simple reward: longer messages get higher rewards (0.1 per character).
        reward = length * 0.1
        return MyenvObservation(
            echoed_message=message,
            message_length=length,
            done=False,
            reward=reward,
            metadata={"original_message": message, "step": self._state.step_count},
        )

    @property
    def state(self) -> State:
        """
        Get the current environment state.

        Returns:
            The State object currently held by the environment (the same
            object that step() mutates), carrying episode_id and step_count.
        """
        return self._state