from typing import Any, Optional, Tuple

import gym
import numpy as np
import gym
import numpy as np
class GymWrapper(gym.Wrapper):
    """
    Wrapper class for all Gym Environments.

    Stores the most recent transition (``state``, ``action``, ``reward``,
    ``done``, ``info``) on every :meth:`step` and forwards any unknown
    attribute access to the underlying environment.

    :param env: Gym environment to wrap
    :type env: gym.Env
    """

    def __init__(self, env: gym.Env):
        super().__init__(env)
        self.env = env
        self.observation_space = self.env.observation_space
        self.action_space = self.env.action_space

        # Last-transition bookkeeping, refreshed by step()
        self.state = None
        self.action = None
        self.reward = None
        self.done = False
        self.info = {}

    def __getattr__(self, name: str) -> Any:
        """
        Forward all other attribute lookups to the base environment.

        Uses ``__getattribute__`` to fetch ``env`` directly so a missing
        ``env`` attribute cannot re-enter this method and recurse forever.
        """
        env = super(GymWrapper, self).__getattribute__("env")
        return getattr(env, name)

    @property
    def obs_shape(self) -> tuple:
        """
        Shape of a single observation.

        :returns: ``(1,)`` for Discrete spaces, the space's own shape for Box
        :raises NotImplementedError: for unsupported observation space types
        """
        space = self.env.observation_space
        if isinstance(space, gym.spaces.Discrete):
            return (1,)
        if isinstance(space, gym.spaces.Box):
            return space.shape
        raise NotImplementedError(
            "Observation space type {} not supported".format(type(space).__name__)
        )

    @property
    def action_shape(self) -> tuple:
        """
        Shape of a single action.

        :returns: the space's own shape for Box, ``(1,)`` for Discrete spaces
        :raises NotImplementedError: for unsupported action space types
        """
        space = self.env.action_space
        if isinstance(space, gym.spaces.Box):
            return space.shape
        if isinstance(space, gym.spaces.Discrete):
            return (1,)
        raise NotImplementedError(
            "Action space type {} not supported".format(type(space).__name__)
        )

    def sample(self) -> np.ndarray:
        """
        Shortcut method to directly sample from environment's action space.

        :returns: Random action from action space
        :rtype: NumPy Array
        """
        return self.env.action_space.sample()

    def render(self, mode: str = "human") -> Any:
        """
        Renders the environment.

        :param mode: Can either be 'human' or 'rgb_array'. \
Displays the frame in 'human' and returns an RGB array in 'rgb_array'
        :type mode: string
        :returns: ``None`` in 'human' mode, the rendered frame in 'rgb_array'
        """
        # Propagate the backend's return value so 'rgb_array' mode
        # actually yields the frame, as the docstring promises.
        return self.env.render(mode=mode)

    def seed(self, seed: Optional[int] = None) -> None:
        """
        Set environment seed.

        :param seed: Value of seed; ``None`` lets the env pick its own
        :type seed: int, optional
        """
        self.env.seed(seed)

    def step(self, action: np.ndarray) -> Tuple[Any, float, bool, dict]:
        """
        Steps the env through given action and records the transition.

        :param action: Action taken by agent
        :type action: NumPy array
        :returns: Next observation, reward, done flag and debugging info
        """
        self.state, self.reward, self.done, self.info = self.env.step(action)
        self.action = action
        return self.state, self.reward, self.done, self.info

    def reset(self) -> np.ndarray:
        """
        Resets environment.

        :returns: Initial state
        """
        return self.env.reset()

    def close(self) -> None:
        """
        Closes environment.
        """
        self.env.close()