tarantula11
/

nitroval10

Model card Files Files and versions

nitroval10 / agent_interface.py

tarantula11's picture

Upload submission from kinitro-agent-template

fe5151f verified 7 months ago

history blame contribute delete

1.57 kB

	"""
	Abstract base class defining the standard interface for all agents.

	All miner-submitted agents must implement this interface to be evaluated.
	"""

	from abc import ABC, abstractmethod

	import gymnasium as gym
	import numpy as np
	import torch


	class AgentInterface(ABC):
	    """
	    Standard interface that all miner implementations must follow.

	    This ensures a consistent contract between the evaluator and any submitted
	    agent, regardless of the underlying model architecture or implementation
	    details. Subclasses must implement :meth:`act`; :meth:`reset` is optional.

	    Attributes set by ``__init__``:
	        observation_space: The space passed in, or a default
	            ``Box(low=-1, high=1, shape=(100,), dtype=float32)``.
	        action_space: The space passed in, or a default
	            ``Box(low=-1, high=1, shape=(4,), dtype=float32)``.
	        seed: The integer seed actually used to build ``rng``.
	        rng: A ``numpy.random.Generator`` seeded with ``seed``.
	    """

	    # The union annotations are quoted so they are not evaluated when the
	    # class body is executed.
	    def __init__(
	        self,
	        observation_space: "gym.Space | None" = None,
	        action_space: "gym.Space | None" = None,
	        seed: "int | None" = None,
	        **kwargs,
	    ):
	        """
	        Store the spaces and set up the random number generator.

	        Args:
	            observation_space: Observation space; a default Box is created
	                when this is None.
	            action_space: Action space; a default Box is created when this
	                is None.
	            seed: Seed for ``self.rng``. When None, a seed is drawn from
	                NumPy's global random state and recorded in ``self.seed``.
	            **kwargs: Accepted for forward compatibility and ignored here.
	        """
	        # Compare against None explicitly: a space object may define
	        # __len__ and be falsy while still being a deliberate argument.
	        if observation_space is None:
	            observation_space = gym.spaces.Box(
	                low=-1, high=1, shape=(100,), dtype=np.float32
	            )
	        if action_space is None:
	            action_space = gym.spaces.Box(
	                low=-1, high=1, shape=(4,), dtype=np.float32
	            )
	        self.observation_space = observation_space
	        self.action_space = action_space

	        # An explicit seed of 0 is valid and must not be replaced.
	        if seed is None:
	            seed = int(np.random.randint(0, 1000000))
	        self.seed = seed
	        # Seed the generator from the recorded seed so that self.seed is
	        # sufficient to reproduce the generator's stream.
	        self.rng = np.random.default_rng(self.seed)

	    @abstractmethod
	    def act(self, obs: dict, **kwargs) -> torch.Tensor:
	        """
	        Take action given current observation and any additional arguments.

	        Args:
	            obs: The current observation, annotated as a dict.
	            **kwargs: Any additional arguments supplied by the caller.

	        Returns:
	            The chosen action, annotated as a ``torch.Tensor``.
	        """

	    def reset(self) -> None:
	        """
	        Reset agent state for new episode.

	        This is called at the beginning of each episode. Stateless agents
	        can implement this as a no-op. Agents with internal memory/history
	        should reset their state here. The base implementation does nothing.
	        """