Spaces:

huggingmenfordays
/

sysadmin-env

Paused

App Files Files Community

sysadmin-env / sysadmin_env /models.py

huggingmenfordays

Upload folder using huggingface_hub

4732653 verified about 1 month ago

raw

history blame contribute delete

1.87 kB

	from enum import Enum
	from typing import Optional

	from pydantic import BaseModel
	from pydantic import Field


	class DifficultyTier(str, Enum):
	    """String-valued enumeration of the three task difficulty levels.

	    Because the class also derives from ``str``, each member compares equal
	    to its plain string value (e.g. ``DifficultyTier.easy == "easy"``).
	    """

	    easy = "easy"
	    medium = "medium"
	    hard = "hard"


	class Action(BaseModel):
	    """A single action: a required command plus optional free-text reasoning."""

	    # Must contain at least one character (min_length=1).
	    # NOTE(review): presumably a shell command line - confirm against the executor.
	    command: str = Field(min_length=1)
	    # Optional explanation accompanying the command; defaults to None.
	    reasoning: Optional[str] = None


	class Observation(BaseModel):
	    """Outcome record for one step: process output, reward and step counters.

	    All fields are required; none has a default value.
	    """

	    stdout: str
	    stderr: str
	    exit_code: int
	    working_directory: str
	    # Must be >= 0.0. NOTE(review): unit is presumably seconds - confirm.
	    execution_time: float = Field(ge=0.0)
	    reward: float
	    done: bool
	    # Must be >= 0.
	    step_number: int = Field(ge=0)
	    # Must be > 0. No check here ties step_number to max_steps.
	    max_steps: int = Field(gt=0)


	class EnvironmentState(BaseModel):
	    """Episode-level state: identifiers, step counters, done flag and reward.

	    All fields are required; none has a default value.
	    """

	    # Both identifiers must be non-empty strings (min_length=1).
	    episode_id: str = Field(min_length=1)
	    task_id: str = Field(min_length=1)
	    # Must be >= 0.
	    step_count: int = Field(ge=0)
	    # Must be > 0.
	    max_steps: int = Field(gt=0)
	    done: bool
	    # NOTE(review): unclear from this model whether this is the last-step
	    # or the cumulative reward - confirm against the code that fills it in.
	    reward: float


	class ResetRequest(BaseModel):
	    """Reset request payload carrying an optional task identifier."""

	    # Defaults to None when omitted.
	    # NOTE(review): how a missing task_id is resolved is decided by the
	    # consumer of this model, not here - confirm against the reset handler.
	    task_id: Optional[str] = None


	class StepRequest(BaseModel):
	    """Step request payload wrapping exactly one required ``Action``."""

	    action: Action


	class StepResult(BaseModel):
	    """Pairs an ``Observation`` with an ``EnvironmentState``; both required."""

	    observation: Observation
	    state: EnvironmentState


	class TaskMetadata(BaseModel):
	    """Static description of a task: identity, difficulty and limits.

	    All fields are required; none has a default value.
	    """

	    # Must be a non-empty string (min_length=1).
	    task_id: str = Field(min_length=1)
	    difficulty: DifficultyTier
	    description: str
	    # Must be > 0.
	    max_steps: int = Field(gt=0)
	    # Must be > 0.0. NOTE(review): unit is presumably seconds - confirm.
	    time_limit: float = Field(gt=0.0)
	    # Plain string; this model does not check that the path exists.
	    base_filesystem_path: str


	class RewardSignal(BaseModel):
	    """Reward breakdown: three component values and a total.

	    This model only constrains the sign of two components; it does not
	    verify that ``total_reward`` matches any combination of the others.
	    """

	    # Unconstrained: may be negative, zero or positive.
	    health_delta: float
	    # Must be >= 0.0.
	    knowledge_delta: float = Field(ge=0.0)
	    # Must be <= 0.0 (a penalty is never positive).
	    action_penalty: float = Field(le=0.0)
	    total_reward: float


	class DiagnosticTrigger(BaseModel):
	    """Associates a fact identifier with command patterns and a reward."""

	    # Must be a non-empty string (min_length=1).
	    fact_id: str = Field(min_length=1)
	    # The list must hold at least one pattern (min_length=1 applies to the list).
	    # NOTE(review): pattern syntax (regex, glob, substring) is not defined
	    # here - confirm against the code that matches commands.
	    command_patterns: list[str] = Field(min_length=1)
	    # Must be strictly positive.
	    reward: float = Field(gt=0.0)


	class TaskScenarioState(BaseModel):
	    """Scenario snapshot: a bounded health score, a done flag and details."""

	    # Constrained to the closed interval [0.0, 1.0].
	    health: float = Field(ge=0.0, le=1.0)
	    done: bool
	    # String keys mapped to bool, float or str values. The union is written
	    # with plain `|`; the backslash-escaped pipes were not valid Python.
	    details: dict[str, bool | float | str]


	class TaskScenarioDefinition(BaseModel):
	    """Task definition: required metadata plus isolation flag and triggers."""

	    metadata: TaskMetadata
	    # Defaults to True when omitted.
	    requires_network_isolation: bool = True
	    # default_factory=list gives each instance its own new empty list.
	    diagnostic_triggers: list[DiagnosticTrigger] = Field(default_factory=list)