Spaces:

zkwentz
/

myenv

Sleeping

App Files Files Community

myenv / server /myenv_environment.py

zkwentz

Upload folder using huggingface_hub

7b3bda1 verified 6 months ago

raw

history blame contribute delete

2.74 kB

	# Copyright (c) Meta Platforms, Inc. and affiliates.
	# All rights reserved.
	#
	# This source code is licensed under the BSD-style license found in the
	# LICENSE file in the root directory of this source tree.

	"""
	Myenv Environment Implementation.

	A simple test environment that echoes back messages sent to it.
	Perfect for testing HTTP server infrastructure.
	"""

	from uuid import uuid4

	from openenv_core.env_server.interfaces import Environment
	from openenv_core.env_server.types import State

	from myenv.models import MyenvAction, MyenvObservation


	class MyenvEnvironment(Environment):
	    """
	    A simple echo environment that echoes back messages.

	    Each call to ``step`` returns the received message unchanged together
	    with its length and a reward proportional to that length. The only
	    state kept is a ``State`` object (episode id and step count) and a
	    private counter of how many times ``reset`` has been called.

	    Example:
	        >>> env = MyenvEnvironment()
	        >>> obs = env.reset()
	        >>> print(obs.echoed_message)  # "Myenv environment ready!"
	        >>>
	        >>> obs = env.step(MyenvAction(message="Hello"))
	        >>> print(obs.echoed_message)  # "Hello"
	        >>> print(obs.message_length)  # 5
	    """

	    # Reward granted per character of the echoed message.
	    REWARD_PER_CHARACTER: float = 0.1

	    def __init__(self):
	        """Initialize the environment with a fresh episode id and zeroed counters."""
	        # NOTE(review): the base-class initializer is not invoked here;
	        # confirm against openenv_core whether Environment requires it.
	        self._state = State(episode_id=str(uuid4()), step_count=0)
	        self._reset_count = 0

	    def reset(self) -> MyenvObservation:
	        """
	        Reset the environment.

	        Replaces the current state with a new one (new random episode id,
	        step count 0) and increments the internal reset counter.

	        Returns:
	            MyenvObservation with a ready message, length 0, reward 0.0
	            and ``done=False``.
	        """
	        self._state = State(episode_id=str(uuid4()), step_count=0)
	        self._reset_count += 1

	        return MyenvObservation(
	            echoed_message="Myenv environment ready!",
	            message_length=0,
	            done=False,
	            reward=0.0,
	        )

	    def step(self, action: MyenvAction) -> MyenvObservation:  # type: ignore[override]
	        """
	        Execute a step in the environment by echoing the message.

	        Increments the step count on the current state before building
	        the observation, so the reported ``step`` is 1-based within an
	        episode.

	        Args:
	            action: MyenvAction containing the message to echo.

	        Returns:
	            MyenvObservation with the echoed message, its length, a reward
	            of ``length * REWARD_PER_CHARACTER``, ``done=False``, and
	            metadata holding the original message and the current step.
	        """
	        self._state.step_count += 1

	        message = action.message
	        length = len(message)

	        # Simple reward: longer messages get higher rewards.
	        reward = length * self.REWARD_PER_CHARACTER

	        return MyenvObservation(
	            echoed_message=message,
	            message_length=length,
	            done=False,
	            reward=reward,
	            metadata={"original_message": message, "step": self._state.step_count},
	        )

	    @property
	    def state(self) -> State:
	        """
	        Get the current environment state.

	        Returns:
	            The live State object (episode_id and step_count) held by this
	            environment; it is returned as-is, not copied.
	        """
	        return self._state