Final_Assignment_AWorld

Sleeping

App Files Files Community

Duibonduil committed on Jun 30, 2025

Commit

10b3362

verified ·

1 Parent(s): 236dcf5

Upload 4 files

Browse files

Files changed (4) hide show

examples/tools/gym_tool/actions.py +12 -0
examples/tools/gym_tool/async_openai_gym.py +153 -0
examples/tools/gym_tool/openai_gym.py +153 -0
examples/tools/gym_tool/requirements.txt +2 -0

examples/tools/gym_tool/actions.py ADDED Viewed

	@@ -0,0 +1,12 @@

+# coding: utf-8
+# Copyright (c) 2025 inclusionAI.
+from examples.tools.tool_action import GymAction
+from aworld.core.tool.action_factory import ActionFactory
+from aworld.core.tool.action import ExecutableAction
+@ActionFactory.register(name=GymAction.PLAY.value.name,
+                        desc=GymAction.PLAY.value.desc,
+                        tool_name="openai_gym")
+class Play(ExecutableAction):
+    """"""

examples/tools/gym_tool/async_openai_gym.py ADDED Viewed

	@@ -0,0 +1,153 @@

+# coding: utf-8
+# Copyright (c) 2025 inclusionAI.
+from typing import Dict, Any, Tuple, SupportsFloat, Union, List
+from pydantic import BaseModel
+from aworld.config import ConfigDict
+from examples.tools.tool_action import GymAction
+from aworld.core.common import ActionModel, Observation, ActionResult
+from aworld.core.tool.base import AsyncTool, ToolFactory
+from aworld.utils.import_package import import_packages
+from aworld.tools.utils import build_observation
+class ActionType(object):
+    DISCRETE = 'discrete'
+    CONTINUOUS = 'continuous'
+@ToolFactory.register(name="openai_gym", desc="gym classic control game", asyn=True, supported_action=GymAction)
+class OpenAIGym(AsyncTool):
+    def __init__(self, conf: Union[Dict[str, Any], ConfigDict, BaseModel], **kwargs) -> None:
+        """Gym environment constructor.
+        Args:
+            env_id: gym environment full name
+            wrappers: gym environment wrapper list
+        """
+        import_packages(['pygame', 'gymnasium'])
+        super(OpenAIGym, self).__init__(conf, **kwargs)
+        self.env_id = self.conf.get("env_id")
+        self._render = self.conf.get('render', True)
+        if self._render:
+            kwargs['render_mode'] = self.conf.get('render_mode', True)
+        kwargs.pop('name', None)
+        self.env = self._gym_env_wrappers(self.env_id, self.conf.get("wrappers", []), **kwargs)
+        self.action_space = self.env.action_space
+    async def do_step(self, actions: List[ActionModel], **kwargs) -> Tuple[
+        Observation, SupportsFloat, bool, bool, Dict[str, Any]]:
+        if self._render:
+            await self.render()
+        action = actions[0].params['result']
+        action = OpenAIGym.transform_action(action=action)
+        state, reward, terminal, truncate, info = self.env.step(action)
+        info.update(kwargs)
+        self._finished = terminal
+        action_results = []
+        for _ in actions:
+            action_results.append(ActionResult(content=OpenAIGym.transform_state(state=state), success=True))
+        return (build_observation(observer=self.name(),
+                                  action_result=action_results,
+                                  ability=GymAction.PLAY.value.name,
+                                  content=OpenAIGym.transform_state(state=state),
+                                  env_id=self.env_id,
+                                  done=terminal,
+                                  **kwargs),
+                reward,
+                terminal,
+                truncate,
+                info)
+    async def render(self):
+        return self.env.render()
+    async def close(self):
+        if self.env:
+            self.env.close()
+        self.env = None
+    async def reset(self, *, seed: int | None = None, options: Dict[str, str] | None = None) -> Tuple[
+        Any, Dict[str, Any]]:
+        state = self.env.reset()
+        return build_observation(observer=self.name(),
+                                 ability=GymAction.PLAY.value.name,
+                                 content=OpenAIGym.transform_state(state=state),
+                                 env_id=self.env_id,
+                                 done=False), {}
+    def _action_dim(self):
+        from gymnasium import spaces
+        if isinstance(self.env.action_space, spaces.Discrete):
+            self.action_type = ActionType.DISCRETE
+            return self.env.action_space.n
+        elif isinstance(self.env.action_space, spaces.Box):
+            self.action_type = ActionType.CONTINUOUS
+            return self.env.action_space.shape[0]
+        else:
+            raise Exception('unsupported env.action_space: {}'.format(self.env.action_space))
+    def _state_dim(self):
+        if len(self.env.observation_space.shape) == 1:
+            return self.env.observation_space.shape[0]
+        else:
+            raise Exception('unsupported observation_space.shape: {}'.format(self.env.observation_space))
+    def _gym_env_wrappers(self, env_id, wrappers: list = [], **kwargs):
+        import gymnasium
+        env = gymnasium.make(env_id, **kwargs)
+        if wrappers:
+            for wrapper in wrappers:
+                env = wrapper(env)
+        return env
+    @staticmethod
+    def transform_state(state: Any):
+        if isinstance(state, tuple):
+            states = dict()
+            for n, state in enumerate(state):
+                state = OpenAIGym.transform_state(state=state)
+                if isinstance(state, dict):
+                    for name, state in state.items():
+                        states['gym{}-{}'.format(n, name)] = state
+                else:
+                    states['gym{}'.format(n)] = state
+            return states
+        elif isinstance(state, dict):
+            states = dict()
+            for state_name, state in state.items():
+                state = OpenAIGym.transform_state(state=state)
+                if isinstance(state, dict):
+                    for name, state in state.items():
+                        states['{}-{}'.format(state_name, name)] = state
+                else:
+                    states['{}'.format(state_name)] = state
+            return states
+        else:
+            return state
+    @staticmethod
+    def transform_action(action: Any):
+        if not isinstance(action, dict):
+            return action
+        else:
+            actions = dict()
+            for name, action in action.items():
+                if '-' in name:
+                    name, inner_name = name.split('-', 1)
+                    if name not in actions:
+                        actions[name] = dict()
+                    actions[name][inner_name] = action
+                else:
+                    actions[name] = action
+            for name, action in actions.items():
+                if isinstance(action, dict):
+                    actions[name] = OpenAIGym.transform_action(action=action)
+            return actions

examples/tools/gym_tool/openai_gym.py ADDED Viewed

	@@ -0,0 +1,153 @@

+# coding: utf-8
+# Copyright (c) 2025 inclusionAI.
+from typing import Dict, Any, Tuple, SupportsFloat, List, Union
+from aworld.config import ConfigDict, ToolConfig
+from examples.tools.tool_action import GymAction
+from aworld.core.common import Observation, ActionModel, ActionResult
+from aworld.core.tool.base import Tool, ToolFactory
+from aworld.utils.import_package import import_packages
+from aworld.tools.utils import build_observation
+class ActionType(object):
+    DISCRETE = 'discrete'
+    CONTINUOUS = 'continuous'
+@ToolFactory.register(name="openai_gym",
+                      desc="gym classic control game",
+                      supported_action=GymAction,
+                      conf_file_name=f'openai_gym_tool.yaml')
+class OpenAIGym(Tool):
+    def __init__(self, conf: Union[Dict[str, Any], ConfigDict, ToolConfig], **kwargs) -> None:
+        """Gym environment constructor.
+        Args:
+            env_id: gym environment full name
+            wrappers: gym environment wrapper list
+        """
+        import_packages(['pygame', 'gymnasium'])
+        super(OpenAIGym, self).__init__(conf, **kwargs)
+        self.env_id = self.conf.get("env_id")
+        self._render = self.conf.get('render', True)
+        if self._render:
+            kwargs['render_mode'] = self.conf.get('render_mode', 'human')
+        kwargs.pop('name', None)
+        self.env = self._gym_env_wrappers(self.env_id, self.conf.get("wrappers", []), **kwargs)
+        self.action_space = self.env.action_space
+    def do_step(self, actions: List[ActionModel], **kwargs) -> Tuple[
+        Observation, SupportsFloat, bool, bool, Dict[str, Any]]:
+        if self._render:
+            self.render()
+        action = actions[0].params['result']
+        action = OpenAIGym.transform_action(action=action)
+        state, reward, terminal, truncate, info = self.env.step(action)
+        info.update(kwargs)
+        self._finished = terminal
+        action_results = []
+        for _ in actions:
+            action_results.append(ActionResult(content=OpenAIGym.transform_state(state=state), success=True))
+        return (build_observation(observer=self.name(),
+                                  action_result=action_results,
+                                  ability=GymAction.PLAY.value.name,
+                                  content=OpenAIGym.transform_state(state=state),
+                                  env_id=self.env_id,
+                                  done=terminal,
+                                  **kwargs),
+                reward,
+                terminal,
+                truncate,
+                info)
+    def render(self):
+        return self.env.render()
+    def close(self):
+        if self.env:
+            self.env.close()
+        self.env = None
+    def reset(self, *, seed: int | None = None, options: Dict[str, str] | None = None) -> Tuple[Any, Dict[str, Any]]:
+        state = self.env.reset()
+        return build_observation(observer=self.name(),
+                                 ability=GymAction.PLAY.value.name,
+                                 content=OpenAIGym.transform_state(state=state),
+                                 env_id=self.env_id,
+                                 done=False), {}
+    def _action_dim(self):
+        from gymnasium import spaces
+        if isinstance(self.env.action_space, spaces.Discrete):
+            self.action_type = ActionType.DISCRETE
+            return self.env.action_space.n
+        elif isinstance(self.env.action_space, spaces.Box):
+            self.action_type = ActionType.CONTINUOUS
+            return self.env.action_space.shape[0]
+        else:
+            raise Exception('unsupported env.action_space: {}'.format(self.env.action_space))
+    def _state_dim(self):
+        if len(self.env.observation_space.shape) == 1:
+            return self.env.observation_space.shape[0]
+        else:
+            raise Exception('unsupported observation_space.shape: {}'.format(self.env.observation_space))
+    def _gym_env_wrappers(self, env_id, wrappers: list = [], **kwargs):
+        import gymnasium
+        env = gymnasium.make(env_id, **kwargs)
+        if wrappers:
+            for wrapper in wrappers:
+                env = wrapper(env)
+        return env
+    @staticmethod
+    def transform_state(state: Any):
+        if isinstance(state, tuple):
+            states = dict()
+            for n, state in enumerate(state):
+                state = OpenAIGym.transform_state(state=state)
+                if isinstance(state, dict):
+                    for name, state in state.items():
+                        states['gym{}-{}'.format(n, name)] = state
+                else:
+                    states['gym{}'.format(n)] = state
+            return states
+        elif isinstance(state, dict):
+            states = dict()
+            for state_name, state in state.items():
+                state = OpenAIGym.transform_state(state=state)
+                if isinstance(state, dict):
+                    for name, state in state.items():
+                        states['{}-{}'.format(state_name, name)] = state
+                else:
+                    states['{}'.format(state_name)] = state
+            return states
+        else:
+            return state
+    @staticmethod
+    def transform_action(action: Any):
+        if not isinstance(action, dict):
+            return action
+        else:
+            actions = dict()
+            for name, action in action.items():
+                if '-' in name:
+                    name, inner_name = name.split('-', 1)
+                    if name not in actions:
+                        actions[name] = dict()
+                    actions[name][inner_name] = action
+                else:
+                    actions[name] = action
+            for name, action in actions.items():
+                if isinstance(action, dict):
+                    actions[name] = OpenAIGym.transform_action(action=action)
+            return actions

examples/tools/gym_tool/requirements.txt ADDED Viewed

	@@ -0,0 +1,2 @@


1	+ gymnasium~=1.1.0
2	+ pygame~=2.6.1