code_assessment_env / client.py
TulasiSankar's picture
update client.py (#5)
b996c20
Raw
History Blame Contribute Delete
2.56 kB
# Copyright (c) Meta Platforms, Inc. and affiliates.
# All rights reserved.
#
# This source code is licensed under the BSD-style license found in the
# LICENSE file in the root directory of this source tree.
"""AI Response Evaluation Environment Client."""
from typing import Dict
from openenv.core import EnvClient
from openenv.core.client_types import StepResult
from openenv.core.env_server.types import State
from .models import CodeAssessmentAction, CodeAssessmentObservation
class CodeAssessmentEnv(
EnvClient[CodeAssessmentAction, CodeAssessmentObservation, State]
):
"""
Client for the AI Response Evaluation Environment.
Example:
>>> env = await CodeAssessmentEnv.from_docker_image("code_assessment_env:latest")
>>> result = await env.reset()
>>> print(result.observation.task_type)
>>> result = await env.step(CodeAssessmentAction(answer="incorrect, factual-error"))
"""
def _step_payload(self, action: CodeAssessmentAction) -> Dict:
return {"answer": action.answer}
def _parse_result(self, payload: Dict) -> StepResult[CodeAssessmentObservation]:
obs_data = payload.get("observation", {})
observation = CodeAssessmentObservation(
problem_description=obs_data.get("problem_description", ""),
difficulty=obs_data.get("difficulty", "easy"),
test_case_input=obs_data.get("test_case_input", ""),
task_type=obs_data.get("task_type", "correctness_check"),
language=obs_data.get("language", "en"),
user_age=obs_data.get("user_age"),
user_mood=obs_data.get("user_mood"),
user_context=obs_data.get("user_context"),
expected_output=obs_data.get("expected_output"),
feedback=obs_data.get("feedback", ""),
is_correct=obs_data.get("is_correct", False),
partial_credit=obs_data.get("partial_credit", 0.0),
problems_solved=obs_data.get("problems_solved", 0),
current_streak=obs_data.get("current_streak", 0),
done=payload.get("done", False),
reward=payload.get("reward"),
metadata=obs_data.get("metadata", {}),
)
return StepResult(
observation=observation,
reward=payload.get("reward"),
done=payload.get("done", False),
)
def _parse_state(self, payload: Dict) -> State:
return State(
episode_id=payload.get("episode_id"),
step_count=payload.get("step_count", 0),
)