| import gym_aloha |
| import gymnasium |
| import numpy as np |
| from openpi_client import image_tools |
| from openpi_client.runtime import environment as _environment |
| from typing_extensions import override |
|
|
|
|
| class AlohaSimEnvironment(_environment.Environment): |
| """An environment for an Aloha robot in simulation.""" |
|
|
| def __init__(self, task: str, obs_type: str = "pixels_agent_pos", seed: int = 0) -> None: |
| np.random.seed(seed) |
| self._rng = np.random.default_rng(seed) |
|
|
| self._gym = gymnasium.make(task, obs_type=obs_type) |
|
|
| self._last_obs = None |
| self._done = True |
| self._episode_reward = 0.0 |
|
|
| @override |
| def reset(self) -> None: |
| gym_obs, _ = self._gym.reset(seed=int(self._rng.integers(2**32 - 1))) |
| self._last_obs = self._convert_observation(gym_obs) |
| self._done = False |
| self._episode_reward = 0.0 |
|
|
| @override |
| def is_episode_complete(self) -> bool: |
| return self._done |
|
|
| @override |
| def get_observation(self) -> dict: |
| if self._last_obs is None: |
| raise RuntimeError("Observation is not set. Call reset() first.") |
|
|
| return self._last_obs |
|
|
| @override |
| def apply_action(self, action: dict) -> None: |
| gym_obs, reward, terminated, truncated, info = self._gym.step(action["actions"]) |
| self._last_obs = self._convert_observation(gym_obs) |
| self._done = terminated or truncated |
| self._episode_reward = max(self._episode_reward, reward) |
|
|
| def _convert_observation(self, gym_obs: dict) -> dict: |
| img = gym_obs["pixels"]["top"] |
| img = image_tools.convert_to_uint8(image_tools.resize_with_pad(img, 224, 224)) |
| |
| img = np.transpose(img, (2, 0, 1)) |
|
|
| return { |
| "state": gym_obs["agent_pos"], |
| "images": {"cam_high": img}, |
| } |
|
|