trace

Sleeping

trace / server /trace_environment.py

Ayush

Update

4156f51 2 months ago

4.27 kB

	"""
	Trace Environment Implementation.

	An RL environment for Gmail financial transaction intelligence.
	Wraps the internal TraceEnv with the OpenEnv Environment interface.
	"""

	import os
	import sys
	import yaml
	import logging
	from uuid import uuid4

	from openenv.core.env_server.interfaces import Environment
	from openenv.core.env_server.types import State

	logger = logging.getLogger(__name__)

	# Docker import bootstrap: the directory one level above this file's folder
	# is treated as the project root and is placed at the front of sys.path
	# (only if it is not already listed) so the internal imports below resolve.
	_PROJECT_ROOT = os.path.abspath(
	    os.path.join(os.path.dirname(__file__), "..")
	)
	if _PROJECT_ROOT not in sys.path:
	    sys.path.insert(0, _PROJECT_ROOT)

	try:
	from ..models import TraceAction, TraceObservation
	except (ImportError, SystemError):
	from models import TraceAction, TraceObservation

	# Import the internal environment
	from environments.trace_env.core.env import TraceEnv
	from environments.trace_env.core.schemas import TraceAction as InternalAction


	class TraceEnvironment(Environment):
	    """
	    OpenEnv-compatible wrapper around the Trace internal environment.

	    The environment fetches real financial transaction data from Gmail,
	    parses PDF/HTML attachments, and syncs to Google Sheets.

	    Every call is delegated to an internal ``TraceEnv``; this class only
	    translates between the OpenEnv-facing action/observation models and the
	    internal ones, and tracks the episode id and step count in a ``State``.

	    Example:
	        >>> env = TraceEnvironment()
	        >>> obs = env.reset()
	        >>> print(obs.instruction)
	        >>>
	        >>> obs = env.step(TraceAction(action_type="RETRIEVE", content="financial emails", source="gmail"))
	        >>> print(obs.context)
	    """

	    # Single-session only — Gmail tokens are per-user
	    SUPPORTS_CONCURRENT_SESSIONS: bool = False

	    def __init__(self):
	        """
	        Initialize the Trace environment with config.

	        Loads ``configs/env_config.yaml`` from the project root. A missing
	        file is not an error: a warning is logged and an empty config is
	        used. A document that parses to a falsy value (e.g. an empty file)
	        also falls back to an empty dict.
	        """
	        config_path = os.path.join(_PROJECT_ROOT, "configs", "env_config.yaml")
	        try:
	            # Read as UTF-8 explicitly so parsing does not depend on the
	            # locale's default encoding inside the container.
	            with open(config_path, encoding="utf-8") as f:
	                self._config = yaml.safe_load(f) or {}
	        except FileNotFoundError:
	            logger.warning(f"Config not found at {config_path}, using defaults")
	            self._config = {}

	        self._env = TraceEnv(self._config)
	        # Placeholder state until the first reset() supplies the real episode id.
	        self._state = State(episode_id=str(uuid4()), step_count=0)

	    @staticmethod
	    def _to_observation(obs, *, done, reward, **extra) -> TraceObservation:
	        """
	        Copy an internal observation's fields into a TraceObservation.

	        Args:
	            obs: Observation object returned by the internal environment.
	            done: Episode-finished flag to report.
	            reward: Reward to report.
	            **extra: Additional TraceObservation keyword arguments
	                (``step`` passes ``metadata`` this way; ``reset`` passes none).

	        Returns:
	            TraceObservation mirroring ``obs`` plus the given done/reward.
	        """
	        return TraceObservation(
	            episode_id=obs.episode_id,
	            step=obs.step,
	            instruction=obs.instruction,
	            available_sources=obs.available_sources,
	            context=obs.context,
	            memory_summary=obs.memory_summary,
	            world_state=obs.world_state,
	            done=done,
	            reward=reward,
	            **extra,
	        )

	    def reset(self) -> TraceObservation:
	        """
	        Reset the environment and start a new episode.

	        The internal environment is reset with a fixed audit task, and the
	        tracked state is replaced with the new episode id and a step count
	        of zero.

	        Returns:
	            TraceObservation with initial state (done=False, reward=0.0)
	        """
	        # A fresh dict is built on every reset, so nothing is shared
	        # between episodes.
	        task = {
	            "instruction": "Audit my financial transactions from Gmail.",
	            "difficulty": "medium",
	            "available_sources": ["gmail", "image"],
	            "ground_truth": {},
	        }
	        obs = self._env.reset(task)
	        self._state = State(episode_id=obs.episode_id, step_count=0)

	        return self._to_observation(obs, done=False, reward=0.0)

	    def step(self, action: TraceAction) -> TraceObservation:  # type: ignore[override]
	        """
	        Execute one agent action in the environment.

	        Args:
	            action: TraceAction containing action_type, content, source
	                and metadata

	        Returns:
	            TraceObservation with results; the internal environment's
	            ``info`` value is passed through as ``metadata``.
	        """
	        # Convert OpenEnv action → internal action
	        internal_action = InternalAction(
	            action_type=action.action_type,
	            content=action.content,
	            source=action.source,
	            metadata=action.metadata,
	        )

	        obs, reward, done, info = self._env.step(internal_action)
	        # Counted here per call, independently of the step number carried
	        # on the returned observation.
	        self._state.step_count += 1

	        return self._to_observation(obs, done=done, reward=reward, metadata=info)

	    @property
	    def state(self) -> State:
	        """
	        Get the current environment state.

	        Returns:
	            Current State with episode_id and step_count
	        """
	        return self._state