Spaces:
Sleeping
Sleeping
| # Copyright (c) Meta Platforms, Inc. and affiliates. | |
| # All rights reserved. | |
| # | |
| # This source code is licensed under the BSD-style license found in the | |
| # LICENSE file in the root directory of this source tree. | |
| """AI Response Evaluation Environment Client.""" | |
| from typing import Dict | |
| from openenv.core import EnvClient | |
| from openenv.core.client_types import StepResult | |
| from openenv.core.env_server.types import State | |
| from .models import CodeAssessmentAction, CodeAssessmentObservation | |
class CodeAssessmentEnv(
    EnvClient[CodeAssessmentAction, CodeAssessmentObservation, State]
):
    """
    Client for the AI Response Evaluation Environment.

    Converts between the typed action/observation/state models and the plain
    dict payloads handled by the three hook methods below.
    NOTE(review): these hooks are presumably invoked by ``EnvClient`` during
    ``reset``/``step``/state calls -- confirm against ``openenv.core``.

    Example:
        >>> env = await CodeAssessmentEnv.from_docker_image("code_assessment_env:latest")
        >>> result = await env.reset()
        >>> print(result.observation.task_type)
        >>> result = await env.step(CodeAssessmentAction(answer="incorrect, factual-error"))
    """

    def _step_payload(self, action: CodeAssessmentAction) -> Dict:
        """Build the request payload for a step.

        Args:
            action: The action to send; only its ``answer`` attribute is used.

        Returns:
            A dict with the single key ``"answer"``.
        """
        return {"answer": action.answer}

    def _parse_result(self, payload: Dict) -> StepResult[CodeAssessmentObservation]:
        """Convert a response payload into a typed ``StepResult``.

        Observation fields are read from ``payload["observation"]``; ``done``
        and ``reward`` are read from the top level of ``payload`` and copied
        onto both the observation and the returned ``StepResult``. Missing
        fields fall back to the defaults written out below (``None`` where no
        default is given).

        Args:
            payload: Decoded response dict.

        Returns:
            A ``StepResult`` wrapping the parsed observation.
        """
        # ``dict.get(key, {})`` only substitutes the default when the key is
        # absent. An explicit ``"observation": null`` would produce ``None``
        # and crash on the first ``.get`` below, so treat a null/empty
        # observation the same as a missing one.
        obs_data = payload.get("observation") or {}

        # Read once so the observation and the StepResult always agree.
        done = payload.get("done", False)
        reward = payload.get("reward")

        observation = CodeAssessmentObservation(
            problem_description=obs_data.get("problem_description", ""),
            difficulty=obs_data.get("difficulty", "easy"),
            test_case_input=obs_data.get("test_case_input", ""),
            task_type=obs_data.get("task_type", "correctness_check"),
            language=obs_data.get("language", "en"),
            user_age=obs_data.get("user_age"),
            user_mood=obs_data.get("user_mood"),
            user_context=obs_data.get("user_context"),
            expected_output=obs_data.get("expected_output"),
            feedback=obs_data.get("feedback", ""),
            is_correct=obs_data.get("is_correct", False),
            partial_credit=obs_data.get("partial_credit", 0.0),
            problems_solved=obs_data.get("problems_solved", 0),
            current_streak=obs_data.get("current_streak", 0),
            done=done,
            reward=reward,
            metadata=obs_data.get("metadata", {}),
        )
        return StepResult(
            observation=observation,
            reward=reward,
            done=done,
        )

    def _parse_state(self, payload: Dict) -> State:
        """Convert a state payload into a ``State`` object.

        Args:
            payload: Decoded state dict.

        Returns:
            A ``State`` whose ``episode_id`` is ``None`` and whose
            ``step_count`` is ``0`` when the respective key is missing.
        """
        return State(
            episode_id=payload.get("episode_id"),
            step_count=payload.get("step_count", 0),
        )