Spaces:

burtenshaw
/

gpu_mode

Sleeping

App Files Files Community

gpu_mode / server /gpu_mode_environment.py

burtenshaw HF Staff

Upload folder using huggingface_hub

53022c7 verified 17 days ago

raw

history blame contribute delete

3.1 kB

	# Copyright (c) Meta Platforms, Inc. and affiliates.
	# All rights reserved.
	#
	# This source code is licensed under the BSD-style license found in the
	# LICENSE file in the root directory of this source tree.

	"""
	GPU Mode Environment Implementation.

	A simple test environment that echoes back messages sent to it.
	Perfect for testing HTTP server infrastructure.
	"""

	from uuid import uuid4

	from openenv.core.env_server.interfaces import Environment
	from openenv.core.env_server.types import State

	from models import GpuModeAction, GpuModeObservation


	class GpuModeEnvironment(Environment):
	    """
	    Echo-style environment used to exercise the HTTP server plumbing.

	    Each step hands the incoming message straight back together with its
	    length. The only state kept is an episode id, a step counter and a
	    count of how many times the environment has been reset.

	    Example:
	        >>> env = GpuModeEnvironment()
	        >>> obs = env.reset()
	        >>> print(obs.echoed_message)  # "Gpu Mode environment ready!"
	        >>>
	        >>> obs = env.step(GpuModeAction(message="Hello"))
	        >>> print(obs.echoed_message)  # "Hello"
	        >>> print(obs.message_length)  # 5
	    """

	    # Opt in to concurrent WebSocket sessions.
	    # Only appropriate when instances do not share state: with this flag
	    # set, several WebSocket clients may connect at once, each served by
	    # its own environment instance (when app.py runs in factory mode).
	    SUPPORTS_CONCURRENT_SESSIONS: bool = True

	    def __init__(self):
	        """Create the initial episode state and zero the reset counter."""
	        initial_episode_id = str(uuid4())
	        self._state = State(episode_id=initial_episode_id, step_count=0)
	        self._reset_count = 0

	    def reset(self) -> GpuModeObservation:
	        """
	        Begin a new episode.

	        Replaces the stored state with one carrying a newly generated
	        episode id and a step count of zero, then bumps the reset counter.

	        Returns:
	            GpuModeObservation carrying the ready message, a length of 0,
	            a reward of 0.0 and ``done=False``.
	        """
	        fresh_episode_id = str(uuid4())
	        self._state = State(episode_id=fresh_episode_id, step_count=0)
	        self._reset_count = self._reset_count + 1

	        ready_observation = GpuModeObservation(
	            echoed_message="Gpu Mode environment ready!",
	            message_length=0,
	            done=False,
	            reward=0.0,
	        )
	        return ready_observation

	    def step(self, action: GpuModeAction) -> GpuModeObservation:  # type: ignore[override]
	        """
	        Advance the episode by one step, echoing the action's message.

	        Args:
	            action: GpuModeAction whose ``message`` is echoed back

	        Returns:
	            GpuModeObservation holding the echoed message, its length, a
	            reward proportional to that length, and metadata with the
	            original message and the current step number.
	        """
	        # The step counter is advanced before the action is inspected.
	        self._state.step_count += 1

	        text = action.message
	        text_length = len(text)

	        observation = GpuModeObservation(
	            echoed_message=text,
	            message_length=text_length,
	            done=False,
	            # Reward scales linearly with length: 0.1 per unit of len(message).
	            reward=text_length * 0.1,
	            metadata={"original_message": text, "step": self._state.step_count},
	        )
	        return observation

	    @property
	    def state(self) -> State:
	        """
	        Expose the environment's current state.

	        Returns:
	            The stored State (episode_id and step_count); this is the live
	            object held by the environment, not a copy.
	        """
	        return self._state