Gymnasium/gymnasium/core.py

"""Core API for Environment, Wrapper, ActionWrapper, RewardWrapper and ObservationWrapper."""
from __future__ import annotations

from typing import TYPE_CHECKING, Any, Generic, SupportsFloat, TypeVar

import numpy as np

from gymnasium import spaces
from gymnasium.utils import seeding


if TYPE_CHECKING:
    from gymnasium.envs.registration import EnvSpec

# Generic type parameters used in the annotations of this module.
# ObsType / ActType parametrise ``Env`` (``Env(Generic[ObsType, ActType])``) and appear in the
# signatures of ``step`` / ``reset``; RenderFrame is the element type returned by ``render``.
ObsType = TypeVar("ObsType")
ActType = TypeVar("ActType")
RenderFrame = TypeVar("RenderFrame")


class Env(Generic[ObsType, ActType]):
    r"""The main Gymnasium class for implementing Reinforcement Learning Agents environments.

    The class encapsulates an environment with arbitrary behind-the-scenes dynamics through the :meth:`step` and :meth:`reset` functions.
    An environment can be partially or fully observed by single agents. For multi-agent environments, see PettingZoo.

    The main API methods that users of this class need to know are:

    - :meth:`step` - Updates an environment with actions returning the next agent observation, the reward for taking those actions,
      if the environment has terminated or truncated due to the latest action and information from the environment about the step, i.e. metrics, debug info.
    - :meth:`reset` - Resets the environment to an initial state, required before calling step.
      Returns the first agent observation for an episode and information, i.e. metrics, debug info.
    - :meth:`render` - Renders the environment to help visualise what the agent sees, example modes are "human", "rgb_array", "ansi" for text.
    - :meth:`close` - Closes the environment, important when external software is used, i.e. pygame for rendering, databases

    Environments have additional attributes for users to understand the implementation

    - :attr:`action_space` - The Space object corresponding to valid actions, all valid actions should be contained within the space.
    - :attr:`observation_space` - The Space object corresponding to valid observations, all valid observations should be contained within the space.
    - :attr:`reward_range` - A tuple corresponding to the minimum and maximum possible rewards for an agent over an episode.
      The default reward range is set to :math:`(-\infty,+\infty)`.
    - :attr:`spec` - An environment spec that contains the information used to initialize the environment from :meth:`gymnasium.make`
    - :attr:`metadata` - The metadata of the environment, i.e. render modes, render fps
    - :attr:`np_random` - The random number generator for the environment. This is automatically assigned during
      ``super().reset(seed=seed)`` (when a seed is given) and lazily when accessing ``self.np_random``.

    .. seealso:: For modifying or extending environments use the :py:class:`gymnasium.Wrapper` class
    """

    # Set this in SOME subclasses
    metadata: dict[str, Any] = {"render_modes": []}
    # define render_mode if your environment supports rendering
    render_mode: str | None = None
    reward_range = (-float("inf"), float("inf"))
    spec: EnvSpec | None = None

    # Set these in ALL subclasses
    action_space: spaces.Space[ActType]
    observation_space: spaces.Space[ObsType]

    # Created lazily by the ``np_random`` property or by ``reset(seed=...)``
    _np_random: np.random.Generator | None = None

    def step(
        self, action: ActType
    ) -> tuple[ObsType, SupportsFloat, bool, bool, dict[str, Any]]:
        """Run one timestep of the environment's dynamics using the agent actions.

        When the end of an episode is reached (``terminated or truncated``), it is necessary to call :meth:`reset` to
        reset this environment's state for the next episode.

        .. versionchanged:: 0.26

            The Step API was changed removing ``done`` in favor of ``terminated`` and ``truncated`` to make it clearer
            to users when the environment had terminated or truncated which is critical for reinforcement learning
            bootstrapping algorithms.

        Args:
            action (ActType): an action provided by the agent to update the environment state.

        Returns:
            observation (ObsType): An element of the environment's :attr:`observation_space` as the next observation due to the agent actions.
                An example is a numpy array containing the positions and velocities of the pole in CartPole.
            reward (SupportsFloat): The reward as a result of taking the action.
            terminated (bool): Whether the agent reaches the terminal state (as defined under the MDP of the task)
                which can be positive or negative. An example is reaching the goal state or moving into the lava from
                the Sutton and Barto Gridworld. If true, the user needs to call :meth:`reset`.
            truncated (bool): Whether the truncation condition outside the scope of the MDP is satisfied.
                Typically, this is a timelimit, but could also be used to indicate an agent physically going out of bounds.
                Can be used to end the episode prematurely before a terminal state is reached.
                If true, the user needs to call :meth:`reset`.
            info (dict): Contains auxiliary diagnostic information (helpful for debugging, learning, and logging).
                This might, for instance, contain: metrics that describe the agent's performance state, variables that are
                hidden from observations, or individual reward terms that are combined to produce the total reward.
                In OpenAI Gym <v26, it contains "TimeLimit.truncated" to distinguish truncation and termination,
                however this is deprecated in favour of returning terminated and truncated variables.

        Raises:
            NotImplementedError: Always, in this base class; subclasses must override :meth:`step`.

        Note:
            ``done`` (bool) is deprecated and no longer part of the returned tuple. It was a boolean value for if the
            episode has ended, in which case further :meth:`step` calls will return undefined results. It was removed
            in OpenAI Gym v26 in favor of ``terminated`` and ``truncated``. A done signal could be emitted for
            different reasons: maybe the task underlying the environment was solved successfully, a certain timelimit
            was exceeded, or the physics simulation has entered an invalid state.
        """
        raise NotImplementedError

    def reset(
        self,
        *,
        seed: int | None = None,
        options: dict[str, Any] | None = None,
    ) -> tuple[ObsType, dict[str, Any]]:  # type: ignore
        """Resets the environment to an initial internal state, returning an initial observation and info.

        This method generates a new starting state often with some randomness to ensure that the agent explores the
        state space and learns a generalised policy about the environment. This randomness can be controlled
        with the ``seed`` parameter otherwise if the environment already has a random number generator and
        :meth:`reset` is called with ``seed=None``, the RNG is not reset.

        Therefore, :meth:`reset` should (in the typical use case) be called with a seed right after initialization and then never again.

        For Custom environments, the first line of :meth:`reset` should be ``super().reset(seed=seed)`` which implements
        the seeding correctly.

        Note:
            This base implementation only handles seeding and itself returns ``None``; subclasses are expected to
            build and return the ``(observation, info)`` pair after calling ``super().reset(seed=seed)``.

        .. versionchanged:: v0.25

            The ``return_info`` parameter was removed and now info is expected to be returned.

        Args:
            seed (optional int): The seed that is used to initialize the environment's PRNG (`np_random`).
                If the environment does not already have a PRNG and ``seed=None`` (the default option) is passed,
                a seed will be chosen from some source of entropy (e.g. timestamp or /dev/urandom).
                However, if the environment already has a PRNG and ``seed=None`` is passed, the PRNG will *not* be reset.
                If you pass an integer, the PRNG will be reset even if it already exists.
                Usually, you want to pass an integer *right after the environment has been initialized and then never again*.
            options (optional dict): Additional information to specify how the environment is reset (optional,
                depending on the specific environment). Unused by this base implementation.

        Returns:
            observation (ObsType): Observation of the initial state. This will be an element of :attr:`observation_space`
                (typically a numpy array) and is analogous to the observation returned by :meth:`step`.
            info (dictionary):  This dictionary contains auxiliary information complementing ``observation``. It should be analogous to
                the ``info`` returned by :meth:`step`.
        """
        # Initialize the RNG if the seed is manually passed.
        # ``seeding.np_random`` returns a pair; only the generator is kept here.
        if seed is not None:
            self._np_random, _ = seeding.np_random(seed)

    def render(self) -> RenderFrame | list[RenderFrame] | None:
        """Compute the render frames as specified by :attr:`render_mode` during the initialization of the environment.

        The environment's :attr:`metadata` render modes (`env.metadata["render_modes"]`) should contain the possible
        ways to implement the render modes. In addition, list versions for most render modes are achieved through
        `gymnasium.make` which automatically applies a wrapper to collect rendered frames.

        Note:
            As the :attr:`render_mode` is known during ``__init__``, the objects used to render the environment state
            should be initialised in ``__init__``.

        By convention, if the :attr:`render_mode` is:

        - None (default): no render is computed.
        - "human": The environment is continuously rendered in the current display or terminal, usually for human consumption.
          This rendering should occur during :meth:`step` and :meth:`render` doesn't need to be called. Returns ``None``.
        - "rgb_array": Return a single frame representing the current state of the environment.
          A frame is a ``np.ndarray`` with shape ``(x, y, 3)`` representing RGB values for an x-by-y pixel image.
        - "ansi": Return a string (``str``) or ``StringIO.StringIO`` containing a terminal-style text representation
          for each time step. The text can include newlines and ANSI escape sequences (e.g. for colors).
        - "rgb_array_list" and "ansi_list": List based version of render modes are possible (except Human) through the
          wrapper, :py:class:`gymnasium.wrappers.RenderCollection` that is automatically applied during ``gymnasium.make(..., render_mode="rgb_array_list")``.
          The frames collected are popped after :meth:`render` is called or :meth:`reset`.

        Note:
            Make sure that your class's :attr:`metadata` ``"render_modes"`` key includes the list of supported modes.

        .. versionchanged:: 0.25.0

            The render function was changed to no longer accept parameters, rather these parameters should be specified
            in the environment initialised, i.e., ``gymnasium.make("CartPole-v1", render_mode="human")``

        Raises:
            NotImplementedError: Always, in this base class; subclasses must override :meth:`render`.
        """
        raise NotImplementedError

    def close(self):
        """After the user has finished using the environment, close contains the code necessary to "clean up" the environment.

        This is critical for closing rendering windows, database or HTTP connections.
        The base implementation does nothing.
        """
        pass

    @property
    def unwrapped(self) -> Env[ObsType, ActType]:
        """Returns the base non-wrapped environment.

        Returns:
            Env: The base non-wrapped :class:`gymnasium.Env` instance (``self`` for a plain environment)
        """
        return self

    @property
    def np_random(self) -> np.random.Generator:
        """Returns the environment's internal :attr:`_np_random` that if not set will initialise with a random seed.

        Returns:
            Instances of `np.random.Generator`
        """
        if self._np_random is None:
            # No generator yet: create one without an explicit seed and cache it.
            self._np_random, _ = seeding.np_random()
        return self._np_random

    @np_random.setter
    def np_random(self, value: np.random.Generator):
        """Replaces the environment's random number generator with ``value``."""
        self._np_random = value

    def __str__(self):
        """Returns a string of the environment, including the :attr:`spec` id when :attr:`spec` is set.

        Returns:
            A string identifying the environment
        """
        if self.spec is None:
            return f"<{type(self).__name__} instance>"
        else:
            return f"<{type(self).__name__}<{self.spec.id}>>"

    def __enter__(self):
        """Support with-statement for the environment."""
        return self

    def __exit__(self, *args: Any):
        """Support with-statement for the environment and closes the environment."""
        self.close()
        # propagate exception
        return False


# Type parameters for the observation / action types exposed by a ``Wrapper``; they may differ
# from the ObsType / ActType of the environment being wrapped.
WrapperObsType = TypeVar("WrapperObsType")
WrapperActType = TypeVar("WrapperActType")


class Wrapper(Env[WrapperObsType, WrapperActType]):
    """Wraps a :class:`gymnasium.Env` to allow a modular transformation of the :meth:`step` and :meth:`reset` methods.

    This class is the base class of all wrappers to change the behavior of the underlying environment.
    Wrappers that inherit from this class can modify the :attr:`action_space`, :attr:`observation_space`,
    :attr:`reward_range` and :attr:`metadata` attributes, without changing the underlying environment's attributes.
    Moreover, the behavior of the :meth:`step` and :meth:`reset` methods can be changed by these wrappers.

    Some attributes (:attr:`spec`, :attr:`render_mode`, :attr:`np_random`) will point back to the wrapper's environment
    (i.e. to the corresponding attributes of :attr:`env`).

    Note:
        If you inherit from :class:`Wrapper`, don't forget to call ``super().__init__(env)``
    """

    def __init__(self, env: Env[ObsType, ActType]):
        """Wraps an environment to allow a modular transformation of the :meth:`step` and :meth:`reset` methods.

        Args:
            env: The environment to wrap
        """
        self.env = env

        # ``None`` means "not overridden": the matching property then falls back to ``self.env``.
        self._action_space: spaces.Space[WrapperActType] | None = None
        self._observation_space: spaces.Space[WrapperObsType] | None = None
        self._reward_range: tuple[SupportsFloat, SupportsFloat] | None = None
        self._metadata: dict[str, Any] | None = None

    def __getattr__(self, name: str):
        """Returns an attribute with ``name`` from the wrapped :attr:`env`, unless ``name`` starts with an underscore.

        Python only calls this hook after normal attribute lookup on the wrapper has failed, so it acts as a
        fallback that forwards unknown public attributes to the wrapped environment.

        Args:
            name: The name of the attribute that was not found on the wrapper

        Returns:
            The attribute ``name`` of :attr:`env`

        Raises:
            AttributeError: If ``name`` is private (starts with an underscore), or if ``name`` is ``"env"``,
                meaning the wrapper has no wrapped environment yet (``super().__init__(env)`` was not called).
        """
        if name == "_np_random":
            raise AttributeError(
                "Can't access `_np_random` of a wrapper, use `self.unwrapped._np_random` or `self.np_random`."
            )
        elif name.startswith("_"):
            raise AttributeError(f"accessing private attribute '{name}' is prohibited")
        elif name == "env":
            # Reaching this branch means ``self.env`` itself is missing. Forwarding below evaluates
            # ``self.env`` again, which would re-enter this method forever and end in a RecursionError.
            raise AttributeError(
                f"'{type(self).__name__}' object has no attribute 'env', was `super().__init__(env)` called?"
            )
        return getattr(self.env, name)

    @property
    def spec(self) -> EnvSpec | None:
        """Returns the :attr:`Env` :attr:`spec` attribute."""
        return self.env.spec

    @classmethod
    def class_name(cls) -> str:
        """Returns the class name of the wrapper."""
        return cls.__name__

    @property
    def action_space(
        self,
    ) -> spaces.Space[ActType] | spaces.Space[WrapperActType]:
        """Return the :attr:`Env` :attr:`action_space` unless overwritten then the wrapper :attr:`action_space` is used."""
        if self._action_space is None:
            return self.env.action_space
        return self._action_space

    @action_space.setter
    def action_space(self, space: spaces.Space[WrapperActType]):
        """Overrides the action space reported by this wrapper."""
        self._action_space = space

    @property
    def observation_space(
        self,
    ) -> spaces.Space[ObsType] | spaces.Space[WrapperObsType]:
        """Return the :attr:`Env` :attr:`observation_space` unless overwritten then the wrapper :attr:`observation_space` is used."""
        if self._observation_space is None:
            return self.env.observation_space
        return self._observation_space

    @observation_space.setter
    def observation_space(self, space: spaces.Space[WrapperObsType]):
        """Overrides the observation space reported by this wrapper."""
        self._observation_space = space

    @property
    def reward_range(self) -> tuple[SupportsFloat, SupportsFloat]:
        """Return the :attr:`Env` :attr:`reward_range` unless overwritten then the wrapper :attr:`reward_range` is used."""
        if self._reward_range is None:
            return self.env.reward_range
        return self._reward_range

    @reward_range.setter
    def reward_range(self, value: tuple[SupportsFloat, SupportsFloat]):
        """Overrides the reward range reported by this wrapper."""
        self._reward_range = value

    @property
    def metadata(self) -> dict[str, Any]:
        """Return the :attr:`Env` :attr:`metadata` unless overwritten then the wrapper :attr:`metadata` is used."""
        if self._metadata is None:
            return self.env.metadata
        return self._metadata

    @metadata.setter
    def metadata(self, value: dict[str, Any]):
        """Overrides the metadata reported by this wrapper."""
        self._metadata = value

    @property
    def render_mode(self) -> str | None:
        """Returns the :attr:`Env` :attr:`render_mode`."""
        return self.env.render_mode

    @property
    def np_random(self) -> np.random.Generator:
        """Returns the :attr:`Env` :attr:`np_random` attribute."""
        return self.env.np_random

    @np_random.setter
    def np_random(self, value: np.random.Generator):
        """Sets the :attr:`np_random` of the wrapped :attr:`env`."""
        self.env.np_random = value

    @property
    def _np_random(self):
        """Blocks access to ``_np_random`` on a wrapper by always raising :class:`AttributeError`.

        This property shadows the ``_np_random`` class attribute inherited from :class:`Env`, so a wrapper never
        silently exposes that inherited default. Because the getter raises :class:`AttributeError`, Python falls
        back to :meth:`__getattr__`, which raises its own error for ``_np_random``; that second message is the
        one callers actually see.
        """
        raise AttributeError(
            "Can't access `_np_random` of a wrapper, use `.unwrapped._np_random` or `.np_random`."
        )

    def step(
        self, action: WrapperActType
    ) -> tuple[WrapperObsType, SupportsFloat, bool, bool, dict]:
        """Uses the :meth:`step` of the :attr:`env` that can be overwritten to change the returned data."""
        return self.env.step(action)

    def reset(
        self, *, seed: int | None = None, options: dict[str, Any] | None = None
    ) -> tuple[WrapperObsType, dict[str, Any]]:
        """Uses the :meth:`reset` of the :attr:`env` that can be overwritten to change the returned data."""
        return self.env.reset(seed=seed, options=options)

    def render(self) -> RenderFrame | list[RenderFrame] | None:
        """Uses the :meth:`render` of the :attr:`env` that can be overwritten to change the returned data."""
        return self.env.render()

    def close(self):
        """Closes the wrapper and :attr:`env`."""
        return self.env.close()

    def __str__(self):
        """Returns the wrapper name and the :attr:`env` representation string."""
        return f"<{type(self).__name__}{self.env}>"

    def __repr__(self):
        """Returns the string representation of the wrapper."""
        return str(self)

    @property
    def unwrapped(self) -> Env[ObsType, ActType]:
        """Returns the base environment of the wrapper.

        This will be the bare :class:`gymnasium.Env` environment, underneath all layers of wrappers.
        """
        return self.env.unwrapped


class ObservationWrapper(Wrapper[WrapperObsType, ActType]):
    """Base class for wrappers that transform the observations produced by :meth:`reset` and :meth:`step`.

    Subclasses override :meth:`observation`; every observation coming out of the wrapped :attr:`env` is passed
    through that method before it is handed to the caller. If the transformed observations no longer belong to
    the :attr:`env` observation space, set :attr:`self.observation_space` in the subclass ``__init__`` to
    describe the new space.

    Gymnasium ships, among others, :class:`TimeAwareObservation`, which adds information about the index of
    the timestep to the observation.
    """

    def __init__(self, env: Env[ObsType, ActType]):
        """Wraps ``env`` so that its observations go through :meth:`observation`."""
        super().__init__(env)

    def reset(
        self, *, seed: int | None = None, options: dict[str, Any] | None = None
    ) -> tuple[WrapperObsType, dict[str, Any]]:
        """Resets the :attr:`env` and returns its first observation transformed by :meth:`observation`, plus the untouched info."""
        raw_obs, reset_info = self.env.reset(seed=seed, options=options)
        transformed_obs = self.observation(raw_obs)
        return transformed_obs, reset_info

    def step(
        self, action: ActType
    ) -> tuple[WrapperObsType, SupportsFloat, bool, bool, dict[str, Any]]:
        """Steps the :attr:`env` and replaces the returned observation with the result of :meth:`observation`."""
        raw_obs, step_reward, is_terminated, is_truncated, step_info = self.env.step(
            action
        )
        transformed_obs = self.observation(raw_obs)
        return transformed_obs, step_reward, is_terminated, is_truncated, step_info

    def observation(self, observation: ObsType) -> WrapperObsType:
        """Transforms a single observation; must be implemented by subclasses.

        Args:
            observation: The observation emitted by the wrapped :attr:`env`

        Returns:
            The transformed observation

        Raises:
            NotImplementedError: Always, in this base class.
        """
        raise NotImplementedError


class RewardWrapper(Wrapper[ObsType, ActType]):
    """Base class for wrappers that transform the reward returned by :meth:`step`.

    Subclasses override :meth:`reward`; the reward coming out of the wrapped :attr:`env` is passed through that
    method before it reaches the learning code. When the transformation alters the possible range of rewards,
    assign :attr:`self.reward_range` in the subclass ``__init__`` to describe the new range.
    """

    def __init__(self, env: Env[ObsType, ActType]):
        """Wraps ``env`` so that its rewards go through :meth:`reward`."""
        super().__init__(env)

    def step(
        self, action: ActType
    ) -> tuple[ObsType, SupportsFloat, bool, bool, dict[str, Any]]:
        """Steps the :attr:`env` and replaces the returned reward with the result of :meth:`reward`."""
        obs, raw_reward, is_terminated, is_truncated, step_info = self.env.step(action)
        shaped_reward = self.reward(raw_reward)
        return obs, shaped_reward, is_terminated, is_truncated, step_info

    def reward(self, reward: SupportsFloat) -> SupportsFloat:
        """Transforms a single reward; must be implemented by subclasses.

        Args:
            reward: The reward returned by the :attr:`env` :meth:`step`

        Returns:
            The transformed reward

        Raises:
            NotImplementedError: Always, in this base class.
        """
        raise NotImplementedError


class ActionWrapper(Wrapper[ObsType, WrapperActType]):
    """Base class for wrappers that transform an action before it is passed to :meth:`env.step`.

    Subclasses override :meth:`action`, which receives the action given to the wrapper and must return a value
    from the base environment's action space. The set of actions the wrapper accepts may differ from that
    space; in that case assign :attr:`self.action_space` in the subclass ``__init__`` to describe what the
    wrapper accepts.

    Gymnasium ships, among others, :class:`ClipAction` and :class:`RescaleAction` for clipping and rescaling actions.
    """

    def __init__(self, env: Env[ObsType, ActType]):
        """Wraps ``env`` so that incoming actions go through :meth:`action`."""
        super().__init__(env)

    def step(
        self, action: WrapperActType
    ) -> tuple[ObsType, SupportsFloat, bool, bool, dict[str, Any]]:
        """Converts ``action`` with :meth:`action` and forwards the result to the :attr:`env` :meth:`env.step`."""
        # Resolve the bound step method first, then convert the action (same order as a nested call).
        env_step = self.env.step
        return env_step(self.action(action))

    def action(self, action: WrapperActType) -> ActType:
        """Transforms a single action; must be implemented by subclasses.

        Args:
            action: The action passed to the wrapper's :meth:`step`

        Returns:
            The action to hand to the wrapped environment

        Raises:
            NotImplementedError: Always, in this base class.
        """
        raise NotImplementedError
-												Add Pydocstyle to CI (#2785)

* Added pydocstyle to pre-commit

* Added docstrings for tests and updated the tests for autoreset

* Add pydocstyle exclude folder to allow slowly adding new docstrings

* Add docstrings for setup.py and gym/__init__.py, core.py, error.py and logger.py

* Check that all unwrapped environment are of a particular wrapper type

* Reverted back to import gym.spaces.Space to gym.spaces

* Fixed the __init__.py docstring

* Fixed autoreset autoreset test

* Updated gym __init__.py top docstring

* Remove unnecessary import

* Removed "unused error" and make APIerror deprecated at gym 1.0

* Add pydocstyle description to CONTRIBUTING.md

* Added docstrings section to CONTRIBUTING.md

* Added :meth: and :attr: keywords to docstrings

* Added :meth: and :attr: keywords to docstrings

* Update the step docstring, placing the return type in a note.

* Updated step return type to include each element

* Update maths notation to reward range

* Fixed infinity maths notation
											
										
										
											2022-05-10 15:35:45 +01:00
+								"""Core API for Environment, Wrapper, ActionWrapper, RewardWrapper and ObservationWrapper."""
-												Update the type hinting for core.py (#39)


											
										
										
											2022-11-12 10:21:24 +00:00
+								from __future__ import annotations
 								from typing import TYPE_CHECKING, Any, Generic, SupportsFloat, TypeVar
-												mark abstract methods as abstract (#2158)

Co-authored-by: J K Terry <justinkterry@gmail.com>
											
										
										
											2021-08-05 16:35:07 +02:00
-												removed inline RandomNumberGenerator implementation  (#3022)


											
										
										
											2022-08-22 09:20:28 -04:00
+								import numpy as np
-												Rename to gymnasium

											
										
										
											2022-09-08 10:10:07 +01:00
+								from gymnasium import spaces
 								from gymnasium.utils import seeding
-												Improve closer implementation and docstrings (#126)

* Improve auto close implementation

- Register all envs at initialization time, not just ones created via make
- Simplify names and add more documentation on interface
- Move closer instances into the relevant modules

review-requested: @jietang

* Close environments in the tests

This isn't strictly needed, but means there are fewer Doom
subprocesses hanging around while the tests run.

* Use 4 space indent in comment

* Improve docstrings in core

* Don't pass through args to __new__

The __init__ method gets called once __new__ returns,
so these arguments are either ignored (Python 2) or
result in an error (Python 3). The __init__ method
automatically gets called with the correct arguments.

* Fixup comments

											
										
										
											2016-05-27 12:16:35 -07:00
-												Update and rerun `pre-commit` hooks for better code quality (#179)


											
										
										
											2022-12-04 22:24:02 +08:00
-												Full type hinting (#2942)

* Allows a new RNG to be generated with seed=-1 and updated env_checker to fix bug if environment doesn't use np_random in reset

* Revert "fixed `gym.vector.make` where the checker was being applied in the opposite case than was intended to (#2871)"

This reverts commit 519dfd9117e98e4f52d38064d2b0f79974fb676d.

* Remove bad pushed commits

* Fixed spelling in core.py

* Pins pytest to the last py 3.6 version

* Allow Box automatic scalar shape

* Add test box and change default from () to (1,)

* update Box shape inference with more strict checking

* Update the box shape and add check on the custom Box shape

* Removed incorrect shape type and assert shape code

* Update the Box and associated tests

* Remove all folders and files from pyright exclude

* Revert issues

* Push RedTachyon code review

* Add Python Platform

* Remove play from pyright check

* Fixed CI issues

* remove mujoco env type hinting

* Fixed pixel observation test

* Added some new type hints

* Fixed CI errors

* Fixed CI errors

* Remove play.py from pyright exclude

* Fixed pyright issues
											
										
										
											2022-07-04 18:19:25 +01:00
+								if TYPE_CHECKING:
-												Rename to gymnasium

											
										
										
											2022-09-08 10:10:07 +01:00
+								    from gymnasium.envs.registration import EnvSpec
-												Full type hinting (#2942)

* Allows a new RNG to be generated with seed=-1 and updated env_checker to fix bug if environment doesn't use np_random in reset

* Revert "fixed `gym.vector.make` where the checker was being applied in the opposite case than was intended to (#2871)"

This reverts commit 519dfd9117e98e4f52d38064d2b0f79974fb676d.

* Remove bad pushed commits

* Fixed spelling in core.py

* Pins pytest to the last py 3.6 version

* Allow Box automatic scalar shape

* Add test box and change default from () to (1,)

* update Box shape inference with more strict checking

* Update the box shape and add check on the custom Box shape

* Removed incorrect shape type and assert shape code

* Update the Box and associated tests

* Remove all folders and files from pyright exclude

* Revert issues

* Push RedTachyon code review

* Add Python Platform

* Remove play from pyright check

* Fixed CI issues

* remove mujoco env type hinting

* Fixed pixel observation test

* Added some new type hints

* Fixed CI errors

* Fixed CI errors

* Remove play.py from pyright exclude

* Fixed pyright issues
											
										
										
											2022-07-04 18:19:25 +01:00
-												Typing/basics (#2529)

* Typing in gym/envs/registration.py

* Add registration to type checked list

* Adds type hints to space.py

* Typing in gym.core.Env

* Typing in seeding.py

* fixup Typing after rebase

* revert accidental change

* Install dependencies in pyright runner

* fix: can only install dependencies after checkout

* fix: install types in a venv

* fix path

* skip env activation, install directly from venv interpreter

* absolute path to venv

* use central python installation

* skip one more typecheck

* cleanup gh actions .yml

* Add py.typed to signal using sources for typechecking

* black!

Co-authored-by: sj_petterson <sj_petterson@gmail.com>
Co-authored-by: J K Terry <justinkterry@gmail.com>
											
										
										
											2021-12-22 19:12:57 +01:00
+								ObsType = TypeVar("ObsType")
 								ActType = TypeVar("ActType")
-												Render API (#2671)

* add pygame GUI for frozen_lake.py env

* add new line at EOF

* pre-commit reformat

* improve graphics

* new images and dynamic window size

* darker tile borders and fix ICC profile

* pre-commit hook

* adjust elf and stool size

* Update frozen_lake.py

* reformat

* fix #2600

* #2600

* add rgb_array support

* reformat

* test render api change on FrozenLake

* add render support for reset on frozenlake

* add clock on pygame render

* new render api for blackjack

* new render api for cliffwalking

* new render api for Env class

* update reset method, lunar and Env

* fix wrapper

* fix reset lunar

* new render api for box2d envs

* new render api for mujoco envs

* fix bug

* new render api for classic control envs

* fix tests

* add render_mode None for CartPole

* new render api for test fake envs

* pre-commit hook

* fix FrozenLake

* fix FrozenLake

* more render_mode to super - frozenlake

* remove kwargs from frozen_lake new

* pre-commit hook

* add deprecated render method

* add backwards compatibility

* fix test

* add _render

* move pygame.init() (avoid pygame dependency on init)

* fix pygame dependencies

* remove collect_render() maintain multi-behaviours .render()

* add type hints

* fix renderer

* don't call .render() with None

* improve docstring

* add single_rgb_array to all envs

* remove None from metadata["render_modes"]

* add type hints to test_env_checkers

* fix lint

* add comments to renderer

* add comments to single_depth_array and single_state_pixels

* reformat

* add deprecation warnings and env.render_mode declaration

* fix lint

* reformat

* fix tests

* add docs

* fix car racing determinism

* remove warning test envs, customizable modes on renderer

* remove commments and add todo for env_checker

* fix car racing

* replace render mode check with assert

* update new mujoco

* reformat

* reformat

* change metaclass definition

* fix tests

* implement mark suggestions (test, docs, sets)

* check_render

Co-authored-by: J K Terry <jkterry0@gmail.com>
											
										
										
											2022-06-08 00:20:56 +02:00
+								RenderFrame = TypeVar("RenderFrame")
-												Avoid metaclass conflicts when inheriting from gym.Env (#3001)

Using __init_subclass__ instead of metaclass, suggested by PEP 487(introduced in python3.6).
As a result, downstream package can safely inherit from gym.Env and abc.ABC/Protocol/...(classes with metaclass != type), or set their own metaclass without making a intermediate metaclass inherited from custom metaclass and type(gym.Env).
											
										
										
											2022-08-16 23:19:31 +08:00
+								class Env(Generic[ObsType, ActType]):
-												Updates the Env, Wrapper and Vector API documentation (#48)


											
										
										
											2022-10-12 15:58:01 +01:00
+								    r"""The main Gymnasium class for implementing Reinforcement Learning Agents environments.
-												Add Pydocstyle to CI (#2785)

* Added pydocstyle to pre-commit

* Added docstrings for tests and updated the tests for autoreset

* Add pydocstyle exclude folder to allow slowly adding new docstrings

* Add docstrings for setup.py and gym/__init__.py, core.py, error.py and logger.py

* Check that all unwrapped environment are of a particular wrapper type

* Reverted back to import gym.spaces.Space to gym.spaces

* Fixed the __init__.py docstring

* Fixed autoreset autoreset test

* Updated gym __init__.py top docstring

* Remove unnecessary import

* Removed "unused error" and make APIerror deprecated at gym 1.0

* Add pydocstyle description to CONTRIBUTING.md

* Added docstrings section to CONTRIBUTING.md

* Added :meth: and :attr: keywords to docstrings

* Added :meth: and :attr: keywords to docstrings

* Update the step docstring placing the return type in the as a note.

* Updated step return type to include each element

* Update maths notation to reward range

* Fixed infinity maths notation
											
										
										
											2022-05-10 15:35:45 +01:00
-												Updates the Env, Wrapper and Vector API documentation (#48)


											
										
										
											2022-10-12 15:58:01 +01:00
+								    The class encapsulates an environment with arbitrary behind-the-scenes dynamics through the :meth:`step` and :meth:`reset` functions.
 								    An environment can be partially or fully observed by single agents. For multi-agent environments, see PettingZoo.
-												Update Env docstrings

											
										
										
											2016-04-28 10:33:37 -07:00
 								    The main API methods that users of this class need to know are:
-												Updates the Env, Wrapper and Vector API documentation (#48)


											
										
										
											2022-10-12 15:58:01 +01:00
+								    - :meth:`step` - Updates an environment with actions returning the next agent observation, the reward for taking those actions,
 								      if the environment has terminated or truncated due to the latest action and information from the environment about the step, i.e. metrics, debug info.
 								    - :meth:`reset` - Resets the environment to an initial state, required before calling step.
 								      Returns the first agent observation for an episode and information, i.e. metrics, debug info.
 								    - :meth:`render` - Renders the environment to help visualise what the agent sees; example modes are "human", "rgb_array", "ansi" for text.
 								    - :meth:`close` - Closes the environment, important when external software is used, i.e. pygame for rendering, databases
 								    Environments have additional attributes for users to understand the implementation
 								    - :attr:`action_space` - The Space object corresponding to valid actions, all valid actions should be contained within the space.
 								    - :attr:`observation_space` - The Space object corresponding to valid observations, all valid observations should be contained within the space.
 								    - :attr:`reward_range` - A tuple corresponding to the minimum and maximum possible rewards for an agent over an episode.
 								      The default reward range is set to :math:`(-\infty,+\infty)`.
 								    - :attr:`spec` - An environment spec that contains the information used to initialize the environment from :meth:`gymnasium.make`
 								    - :attr:`metadata` - The metadata of the environment, i.e. render modes, render fps
 								    - :attr:`np_random` - The random number generator for the environment. This is automatically assigned during
 								      ``super().reset(seed=seed)`` and when accessing ``self.np_random``.
 								    .. seealso:: For modifying or extending environments use the :py:class:`gymnasium.Wrapper` class
-												Initial release. Hello world :).

											
										
										
											2016-04-27 08:00:58 -07:00
+								    """
-												Blacken the codebase (#2265)


											
										
										
											2021-07-29 02:26:34 +02:00
-												Initial release. Hello world :).

											
										
										
											2016-04-27 08:00:58 -07:00
+								    # Set this in SOME subclasses
-												Update the type hinting for core.py (#39)


											
										
										
											2022-11-12 10:21:24 +00:00
+								    metadata: dict[str, Any] = {"render_modes": []}
-												Add type annotations for metadata and render_mode (#3007)


											
										
										
											2022-08-01 04:53:41 -07:00
+								    # define render_mode if your environment supports rendering
-												Update the type hinting for core.py (#39)


											
										
										
											2022-11-12 10:21:24 +00:00
+								    render_mode: str | None = None
-												Blacken the codebase (#2265)


											
										
										
											2021-07-29 02:26:34 +02:00
+								    reward_range = (-float("inf"), float("inf"))
-												Update the type hinting for core.py (#39)


											
										
										
											2022-11-12 10:21:24 +00:00
+								    spec: EnvSpec | None = None
-												Add close() to Env, add functionality to call close() on exit

											
										
										
											2016-05-15 15:59:02 -07:00
-												Initial release. Hello world :).

											
										
										
											2016-04-27 08:00:58 -07:00
+								    # Set these in ALL subclasses
-												Typing/basics (#2529)

* Typing in gym/envs/registration.py

* Add registration to type checked list

* Adds type hints to space.py

* Typing in gym.core.Env

* Typing in seeding.py

* fixup Typing after rebase

* revert accidental change

* Install dependencies in pyright runner

* fix: can only install dependencies after checkout

* fix: install types in a venv

* fix path

* skip env activation, install directly from venv interpreter

* absolute path to venv

* use central python installation

* skip one more typecheck

* cleanup gh actions .yml

* Add py.typed to signal using sources for typechecking

* black!

Co-authored-by: sj_petterson <sj_petterson@gmail.com>
Co-authored-by: J K Terry <justinkterry@gmail.com>
											
										
										
											2021-12-22 19:12:57 +01:00
+								    action_space: spaces.Space[ActType]
 								    observation_space: spaces.Space[ObsType]
-												Initial release. Hello world :).

											
										
										
											2016-04-27 08:00:58 -07:00
-												Seeding update (#2422)

* Ditch most of the seeding.py and replace np_random with the numpy default_rng. Let's see if tests pass

* Updated a bunch of RNG calls from the RandomState API to Generator API

* black; didn't expect that, did ya?

* Undo a typo

* blaaack

* More typo fixes

* Fixed setting/getting state in multidiscrete spaces

* Fix typo, fix a test to work with the new sampling

* Correctly (?) pass the randomly generated seed if np_random is called with None as seed

* Convert the Discrete sample to a python int (as opposed to np.int64)

* Remove some redundant imports

* First version of the compatibility layer for old-style RNG. Mainly to trigger tests.

* Removed redundant f-strings

* Style fixes, removing unused imports

* Try to make tests pass by removing atari from the dockerfile

* Try to make tests pass by removing atari from the setup

* Try to make tests pass by removing atari from the setup

* Try to make tests pass by removing atari from the setup

* First attempt at deprecating `env.seed` and supporting `env.reset(seed=seed)` instead. Tests should hopefully pass but throw up a million warnings.

* black; didn't expect that, didya?

* Rename the reset parameter in VecEnvs back to `seed`

* Updated tests to use the new seeding method

* Removed a bunch of old `seed` calls.

Fixed a bug in AsyncVectorEnv

* Stop Discrete envs from doing part of the setup (and using the randomness) in init (as opposed to reset)

* Add explicit seed to wrappers reset

* Remove an accidental return

* Re-add some legacy functions with a warning.

* Use deprecation instead of regular warnings for the newly deprecated methods/functions
											
										
										
											2021-12-08 22:14:15 +01:00
+								    # Created on demand, e.g. by ``reset(seed=...)``
-												Update the type hinting for core.py (#39)


											
										
										
											2022-11-12 10:21:24 +00:00
+								    _np_random: np.random.Generator | None = None
-												Typecheck classic control environments (#2589)

* Typecheck classic control environments

* consistent imports + comments

* Don't use seed method

Although this code is exact duplication, we at least don't call deprecated method.

* Update core.py
											
										
										
											2022-02-10 18:24:41 +01:00
-												Update the type hinting for core.py (#39)


											
										
										
											2022-11-12 10:21:24 +00:00
+								    def step(
 								        self, action: ActType
 								    ) -> tuple[ObsType, SupportsFloat, bool, bool, dict[str, Any]]:
-												Updates the Env, Wrapper and Vector API documentation (#48)


											
										
										
											2022-10-12 15:58:01 +01:00
+								        """Run one timestep of the environment's dynamics using the agent actions.
-												Seeding update (#2422)

* Ditch most of the seeding.py and replace np_random with the numpy default_rng. Let's see if tests pass

* Updated a bunch of RNG calls from the RandomState API to Generator API

* black; didn't expect that, did ya?

* Undo a typo

* blaaack

* More typo fixes

* Fixed setting/getting state in multidiscrete spaces

* Fix typo, fix a test to work with the new sampling

* Correctly (?) pass the randomly generated seed if np_random is called with None as seed

* Convert the Discrete sample to a python int (as opposed to np.int64)

* Remove some redundant imports

* First version of the compatibility layer for old-style RNG. Mainly to trigger tests.

* Removed redundant f-strings

* Style fixes, removing unused imports

* Try to make tests pass by removing atari from the dockerfile

* Try to make tests pass by removing atari from the setup

* Try to make tests pass by removing atari from the setup

* Try to make tests pass by removing atari from the setup

* First attempt at deprecating `env.seed` and supporting `env.reset(seed=seed)` instead. Tests should hopefully pass but throw up a million warnings.

* black; didn't expect that, didya?

* Rename the reset parameter in VecEnvs back to `seed`

* Updated tests to use the new seeding method

* Removed a bunch of old `seed` calls.

Fixed a bug in AsyncVectorEnv

* Stop Discrete envs from doing part of the setup (and using the randomness) in init (as opposed to reset)

* Add explicit seed to wrappers reset

* Remove an accidental return

* Re-add some legacy functions with a warning.

* Use deprecation instead of regular warnings for the newly deprecated methods/functions
											
										
										
											2021-12-08 22:14:15 +01:00
-												Updates the Env, Wrapper and Vector API documentation (#48)


											
										
										
											2022-10-12 15:58:01 +01:00
+								        When the end of an episode is reached (``terminated or truncated``), it is necessary to call :meth:`reset` to
 								        reset this environment's state for the next episode.
-												Setter-based approach for the fix (#2626)


											
										
										
											2022-02-18 01:38:22 +01:00
-												Updates the Env, Wrapper and Vector API documentation (#48)


											
										
										
											2022-10-12 15:58:01 +01:00
+								        .. versionchanged:: 0.26
-												Initial release. Hello world :).

											
										
										
											2016-04-27 08:00:58 -07:00
-												Updates the Env, Wrapper and Vector API documentation (#48)


											
										
										
											2022-10-12 15:58:01 +01:00
+								            The Step API was changed removing ``done`` in favor of ``terminated`` and ``truncated`` to make it clearer
 								            to users when the environment had terminated or truncated which is critical for reinforcement learning
 								            bootstrapping algorithms.
-												Initial release. Hello world :).

											
										
										
											2016-04-27 08:00:58 -07:00
-												Improve closer implementation and docstrings (#126)

* Improve auto close implementation

- Register all envs at initialization time, not just ones created via make
- Simplify names and add more documentation on interface
- Move closer instances into the relevant modules

review-requested: @jietang

* Close environments in the tests

This isn't strictly needed, but means there are fewer Doom
subprocesses hanging around while the tests run.

* Use 4 space indent in comment

* Improve docstrings in core

* Don't pass through args to __new__

The __init__ method gets called once __new__ returns,
so these arguments are either ignored (Python 2) or
result in an error (Python 3). The __init__ method
automatically gets called with the correct arguments.

* Fixup comments

											
										
										
											2016-05-27 12:16:35 -07:00
+								        Args:
-												Updates the Env, Wrapper and Vector API documentation (#48)


											
										
										
											2022-10-12 15:58:01 +01:00
+								            action (ActType): an action provided by the agent to update the environment state.
-												Initial release. Hello world :).

											
										
										
											2016-04-27 08:00:58 -07:00
-												Improve closer implementation and docstrings (#126)

* Improve auto close implementation

- Register all envs at initialization time, not just ones created via make
- Simplify names and add more documentation on interface
- Move closer instances into the relevant modules

review-requested: @jietang

* Close environments in the tests

This isn't strictly needed, but means there are fewer Doom
subprocesses hanging around while the tests run.

* Use 4 space indent in comment

* Improve docstrings in core

* Don't pass through args to __new__

The __init__ method gets called once __new__ returns,
so these arguments are either ignored (Python 2) or
result in an error (Python 3). The __init__ method
automatically gets called with the correct arguments.

* Fixup comments

											
										
										
											2016-05-27 12:16:35 -07:00
+								        Returns:
-												Updates the Env, Wrapper and Vector API documentation (#48)


											
										
										
											2022-10-12 15:58:01 +01:00
+								            observation (ObsType): An element of the environment's :attr:`observation_space` as the next observation due to the agent actions.
 								                An example is a numpy array containing the positions and velocities of the pole in CartPole.
-												Update the type hinting for core.py (#39)


											
										
										
											2022-11-12 10:21:24 +00:00
+								            reward (SupportsFloat): The reward as a result of taking the action.
-												Updates the Env, Wrapper and Vector API documentation (#48)


											
										
										
											2022-10-12 15:58:01 +01:00
+								            terminated (bool): Whether the agent reaches the terminal state (as defined under the MDP of the task)
 								                which can be positive or negative. An example is reaching the goal state or moving into the lava from
 								                the Sutton and Barto Gridworld. If true, the user needs to call :meth:`reset`.
 								            truncated (bool): Whether the truncation condition outside the scope of the MDP is satisfied.
 								                Typically, this is a timelimit, but could also be used to indicate an agent physically going out of bounds.
 								                Can be used to end the episode prematurely before a terminal state is reached.
 								                If true, the user needs to call :meth:`reset`.
 								            info (dict): Contains auxiliary diagnostic information (helpful for debugging, learning, and logging).
-												New Step API with terminated, truncated bools instead of done (#2752)


											
										
										
											2022-07-10 02:18:06 +05:30
+								                This might, for instance, contain: metrics that describe the agent's performance state, variables that are
 								                hidden from observations, or individual reward terms that are combined to produce the total reward.
-												Updates the Env, Wrapper and Vector API documentation (#48)


											
										
										
											2022-10-12 15:58:01 +01:00
+								                In OpenAI Gym <v26, it contains "TimeLimit.truncated" to distinguish truncation and termination,
 								                however this is deprecated in favour of returning terminated and truncated variables.
 								            done (bool): (Deprecated) A boolean value for if the episode has ended, in which case further :meth:`step` calls will
 								                return undefined results. This was removed in OpenAI Gym v26 in favor of terminated and truncated attributes.
 								                A done signal may be emitted for different reasons: Maybe the task underlying the environment was solved successfully,
 								                a certain timelimit was exceeded, or the physics simulation has entered an invalid state.
-												Initial release. Hello world :).

											
										
										
											2016-04-27 08:00:58 -07:00
+								        """
-												Cleanup, removal of unmaintained code (#836)

* add dtype to Box

* remove board_game, debugging, safety, parameter_tuning environments

* massive set of breaking changes
- remove python logging module
- _step, _reset, _seed, _close => non underscored method
- remove benchmark and scoring folder

* Improve render("human"), now resizable, closable window.

* get rid of default step and reset in wrappers, so it doesn’t silently fail for people with underscore methods

* CubeCrash unit test environment

* followup fixes

* MemorizeDigits unit test envrionment

* refactored spaces a bit
fixed indentation
disabled test_env_semantics

* fix unit tests

* fixes

* CubeCrash, MemorizeDigits tested

* gym backwards compatibility patch

* gym backwards compatibility, followup fixes

* changelist, add spaces to main namespaces

* undo_logger_setup for backwards compat

* remove configuration.py

											
										
										
											2018-01-25 18:20:14 -08:00
+								        raise NotImplementedError
-												Initial release. Hello world :).

											
										
										
											2016-04-27 08:00:58 -07:00
-												Add options to the signature of `env.reset` (#2515)

* First find/replace, now tests

* Fixes to the vector env

* Make seed keyword only in wrappers

* (try to) fix the bug with old environments using new wrappers (with the seed keyword)

* black

* Change **kwargs to options, try to make it work; black

* Add OrderEnforcing wrapper to wrapper exports
Add a test for compatibility with old (pybullet-like) envs

* Add OrderEnforcing wrapper to wrapper exports
Add a test for compatibility with old (pybullet-like) envs
black

* Update the env checker

* Update the env checker

* Update the env checker to use inspect (might fail tests, let's see)

* Allow the signature to include kwargs in env_checker

* Minor fix
											
										
										
											2022-01-19 23:28:59 +01:00
+								    def reset(
-												Adding return_info argument to reset to allow for optional info dict as a second return value (#2546)

* initial draft of optional info dict in reset function, implemented for cartpole, tests seem to be passing

* merged core.py

* updated return type annotation for reset function in core.py

* optional metadata with return_info from reset added for all first party environments, with corresponding tests. Incomplete implementation for wrappers and vector wrappers

* removed Optional type for return_info arguments

* added tests for return_info to normalize wrapper and sync_vector_env

* autoformatted using black

* added optional reset metadata tests to several wrappers

* added return_info capability to async_vector_env.py and test to verify functionality

* added optional return_info test for record_video.py

* removed tests for mujoco environments

* autoformatted

* improved test coverage for optional reset return_info

* re-removed unit test envs accidentally reintroduced in merge

* removed unnecessary import

* changes based on code-review

* small fix to core wrapper typing and autoformatted record_epsisode_stats

* small change to pass flake8 style
											
										
										
											2022-02-06 17:28:27 -06:00
+								        self,
 								        *,
-												Update the type hinting for core.py (#39)


											
										
										
											2022-11-12 10:21:24 +00:00
+								        seed: int | None = None,
 								        options: dict[str, Any] | None = None,
 								    ) -> tuple[ObsType, dict[str, Any]]:  # type: ignore
-												Updates the Env, Wrapper and Vector API documentation (#48)


											
										
										
											2022-10-12 15:58:01 +01:00
+								        """Resets the environment to an initial internal state, returning an initial observation and info.
 								        This method generates a new starting state often with some randomness to ensure that the agent explores the
 								        state space and learns a generalised policy about the environment. This randomness can be controlled
 								        with the ``seed`` parameter; otherwise, if the environment already has a random number generator and
 								        :meth:`reset` is called with ``seed=None``, the RNG is not reset.
-												Add Pydocstyle to CI (#2785)

* Added pydocstyle to pre-commit

* Added docstrings for tests and updated the tests for autoreset

* Add pydocstyle exclude folder to allow slowly adding new docstrings

* Add docstrings for setup.py and gym/__init__.py, core.py, error.py and logger.py

* Check that all unwrapped environment are of a particular wrapper type

* Reverted back to import gym.spaces.Space to gym.spaces

* Fixed the __init__.py docstring

* Fixed autoreset autoreset test

* Updated gym __init__.py top docstring

* Remove unnecessary import

* Removed "unused error" and make APIerror deprecated at gym 1.0

* Add pydocstyle description to CONTRIBUTING.md

* Added docstrings section to CONTRIBUTING.md

* Added :meth: and :attr: keywords to docstrings

* Added :meth: and :attr: keywords to docstrings

* Update the step docstring placing the return type in the as a note.

* Updated step return type to include each element

* Update maths notation to reward range

* Fixed infinity maths notation
											
										
										
											2022-05-10 15:35:45 +01:00
-												Updates the Env, Wrapper and Vector API documentation (#48)


											
										
										
											2022-10-12 15:58:01 +01:00
+								        Therefore, :meth:`reset` should (in the typical use case) be called with a seed right after initialization and then never again.
 								        For Custom environments, the first line of :meth:`reset` should be ``super().reset(seed=seed)`` which implements
 								        the seeding correctly.
 								        .. versionchanged:: v0.25
 								            The ``return_info`` parameter was removed and now info is expected to be returned.
-												Initial release. Hello world :).

											
										
										
											2016-04-27 08:00:58 -07:00
-												fix and complete docstrings to match the documentation page (#2697)


											
										
										
											2022-04-06 20:12:55 +01:00
+								        Args:
-												Updates the Env, Wrapper and Vector API documentation (#48)


											
										
										
											2022-10-12 15:58:01 +01:00
+								            seed (optional int): The seed that is used to initialize the environment's PRNG (`np_random`).
-												Add Pydocstyle to CI (#2785)

* Added pydocstyle to pre-commit

* Added docstrings for tests and updated the tests for autoreset

* Add pydocstyle exclude folder to allow slowly adding new docstrings

* Add docstrings for setup.py and gym/__init__.py, core.py, error.py and logger.py

* Check that all unwrapped environment are of a particular wrapper type

* Reverted back to import gym.spaces.Space to gym.spaces

* Fixed the __init__.py docstring

* Fixed autoreset autoreset test

* Updated gym __init__.py top docstring

* Remove unnecessary import

* Removed "unused error" and make APIerror deprecated at gym 1.0

* Add pydocstyle description to CONTRIBUTING.md

* Added docstrings section to CONTRIBUTING.md

* Added :meth: and :attr: keywords to docstrings

* Added :meth: and :attr: keywords to docstrings

* Update the step docstring placing the return type in the as a note.

* Updated step return type to include each element

* Update maths notation to reward range

* Fixed infinity maths notation
											
										
										
											2022-05-10 15:35:45 +01:00
+								                If the environment does not already have a PRNG and ``seed=None`` (the default option) is passed,
 								                a seed will be chosen from some source of entropy (e.g. timestamp or /dev/urandom).
 								                However, if the environment already has a PRNG and ``seed=None`` is passed, the PRNG will *not* be reset.
 								                If you pass an integer, the PRNG will be reset even if it already exists.
 								                Usually, you want to pass an integer *right after the environment has been initialized and then never again*.
 								                Please refer to the minimal example above to see this paradigm in action.
 								            options (optional dict): Additional information to specify how the environment is reset (optional,
 								                depending on the specific environment)
-												fix and complete docstrings to match the documentation page (#2697)


											
										
										
											2022-04-06 20:12:55 +01:00
-												Feature/pixel observation wrapper (#1499)

* Implement PixelObservationWrapper

* Change MujocoEnv.render to support custom camera_{name,id}

* Implement tests for PixelObservationWrapper

* Use env.get_pixels instead of direct env.render

* Fix camera_{id,name} check in pixel observation wrapper

* Fix rendering with explicit camera_id

* Add Wrapperget_pixels to allow call to be propagated to wrapped env

* Remove use of unnecessary `get_pixels` method

* Update PixelObservationWrapper to support multiple pixel keys

* Remove unnecessary `rgb_rendering_tracking` argument

* Remove rgb_rendering_tracking logic

											
										
										
											2019-08-23 15:02:33 -07:00
+								        Returns:
-												Updates the Env, Wrapper and Vector API documentation (#48)


											
										
										
											2022-10-12 15:58:01 +01:00
+								            observation (ObsType): Observation of the initial state. This will be an element of :attr:`observation_space`
-												Add Pydocstyle to CI (#2785)

* Added pydocstyle to pre-commit

* Added docstrings for tests and updated the tests for autoreset

* Add pydocstyle exclude folder to allow slowly adding new docstrings

* Add docstrings for setup.py and gym/__init__.py, core.py, error.py and logger.py

* Check that all unwrapped environment are of a particular wrapper type

* Reverted back to import gym.spaces.Space to gym.spaces

* Fixed the __init__.py docstring

* Fixed autoreset autoreset test

* Updated gym __init__.py top docstring

* Remove unnecessary import

* Removed "unused error" and make APIerror deprecated at gym 1.0

* Add pydocstyle description to CONTRIBUTING.md

* Added docstrings section to CONTRIBUTING.md

* Added :meth: and :attr: keywords to docstrings

* Added :meth: and :attr: keywords to docstrings

* Update the step docstring placing the return type in the as a note.

* Updated step return type to include each element

* Update maths notation to reward range

* Fixed infinity maths notation
											
										
										
											2022-05-10 15:35:45 +01:00
+								                (typically a numpy array) and is analogous to the observation returned by :meth:`step`.
-												Removing return_info argument to env.reset() and deprecated env.seed() function (reset now always returns info) (#2962)

* removed return_info, made info dict mandatory in reset

* tenatively removed deprecated seed api for environments

* added more info type checks to wrapper tests

* formatting/style compliance

* addressed some comments

* polish to address review

* fixed tests after merge, and added a test of the return_info deprecation assertion if found in reset signature

* some organization of env_checker tests, reverted a probably merge error

* added deprecation check for seed function in env

* updated docstring

* removed debug prints, tweaked test_check_seed_deprecation

* changed return_info deprecation check from assertion to warning

* fixes to vector envs, now  should be correctly structured

* added some explanation and typehints for mockup depcreated return info reset function

* re-removed seed function from vector envs

* added explanation to _reset_return_info_type and changed the return statement
											
										
										
											2022-08-23 11:09:54 -04:00
+								            info (dictionary):  This dictionary contains auxiliary information complementing ``observation``. It should be analogous to
-												Add Pydocstyle to CI (#2785)

* Added pydocstyle to pre-commit

* Added docstrings for tests and updated the tests for autoreset

* Add pydocstyle exclude folder to allow slowly adding new docstrings

* Add docstrings for setup.py and gym/__init__.py, core.py, error.py and logger.py

* Check that all unwrapped environment are of a particular wrapper type

* Reverted back to import gym.spaces.Space to gym.spaces

* Fixed the __init__.py docstring

* Fixed autoreset autoreset test

* Updated gym __init__.py top docstring

* Remove unnecessary import

* Removed "unused error" and make APIerror deprecated at gym 1.0

* Add pydocstyle description to CONTRIBUTING.md

* Added docstrings section to CONTRIBUTING.md

* Added :meth: and :attr: keywords to docstrings

* Added :meth: and :attr: keywords to docstrings

* Update the step docstring placing the return type in the as a note.

* Updated step return type to include each element

* Update maths notation to reward range

* Fixed infinity maths notation
											
										
										
											2022-05-10 15:35:45 +01:00
+								                the ``info`` returned by :meth:`step`.
-												Initial release. Hello world :).

											
										
										
											2016-04-27 08:00:58 -07:00
+								        """
-												Typecheck classic control environments (#2589)

* Typecheck classic control environments

* consistent imports + comments

* Don't use seed method

Although this code is exact duplication, we at least don't call deprecated method.

* Update core.py
											
										
										
											2022-02-10 18:24:41 +01:00
+								        # Initialize the RNG if the seed is manually passed
 								        if seed is not None:
 								            self._np_random, seed = seeding.np_random(seed)
-												Initial release. Hello world :).

											
										
										
											2016-04-27 08:00:58 -07:00
-												Update the type hinting for core.py (#39)


											
										
										
											2022-11-12 10:21:24 +00:00
+								    def render(self) -> RenderFrame | list[RenderFrame] | None:
-												Updates the Env, Wrapper and Vector API documentation (#48)


											
										
										
											2022-10-12 15:58:01 +01:00
+								        """Compute the render frames as specified by :attr:`render_mode` during the initialization of the environment.
-												Initial release. Hello world :).

											
										
										
											2016-04-27 08:00:58 -07:00
-												Updates the Env, Wrapper and Vector API documentation (#48)


											
										
										
											2022-10-12 15:58:01 +01:00
+								        The environment's :attr:`metadata` render modes (`env.metadata["render_modes"]`) should contain the possible
 								        ways to implement the render modes. In addition, list versions for most render modes are achieved through
 								        `gymnasium.make` which automatically applies a wrapper to collect rendered frames.
 								        Note:
 								            As the :attr:`render_mode` is known during ``__init__``, the objects used to render the environment state
 								            should be initialised in ``__init__``.
 								        By convention, if the :attr:`render_mode` is:
-												Render API (#2671)

* add pygame GUI for frozen_lake.py env

* add new line at EOF

* pre-commit reformat

* improve graphics

* new images and dynamic window size

* darker tile borders and fix ICC profile

* pre-commit hook

* adjust elf and stool size

* Update frozen_lake.py

* reformat

* fix #2600

* #2600

* add rgb_array support

* reformat

* test render api change on FrozenLake

* add render support for reset on frozenlake

* add clock on pygame render

* new render api for blackjack

* new render api for cliffwalking

* new render api for Env class

* update reset method, lunar and Env

* fix wrapper

* fix reset lunar

* new render api for box2d envs

* new render api for mujoco envs

* fix bug

* new render api for classic control envs

* fix tests

* add render_mode None for CartPole

* new render api for test fake envs

* pre-commit hook

* fix FrozenLake

* fix FrozenLake

* more render_mode to super - frozenlake

* remove kwargs from frozen_lake new

* pre-commit hook

* add deprecated render method

* add backwards compatibility

* fix test

* add _render

* move pygame.init() (avoid pygame dependency on init)

* fix pygame dependencies

* remove collect_render() maintain multi-behaviours .render()

* add type hints

* fix renderer

* don't call .render() with None

* improve docstring

* add single_rgb_array to all envs

* remove None from metadata["render_modes"]

* add type hints to test_env_checkers

* fix lint

* add comments to renderer

* add comments to single_depth_array and single_state_pixels

* reformat

* add deprecation warnings and env.render_mode declaration

* fix lint

* reformat

* fix tests

* add docs

* fix car racing determinism

* remove warning test envs, customizable modes on renderer

* remove comments and add todo for env_checker

* fix car racing

* replace render mode check with assert

* update new mujoco

* reformat

* reformat

* change metaclass definition

* fix tests

* implement mark suggestions (test, docs, sets)

* check_render

Co-authored-by: J K Terry <jkterry0@gmail.com>
											
										
										
											2022-06-08 00:20:56 +02:00
 								        - None (default): no render is computed.
-												Updates the Env, Wrapper and Vector API documentation (#48)


											
										
										
											2022-10-12 15:58:01 +01:00
+								        - "human": The environment is continuously rendered in the current display or terminal, usually for human consumption.
 								          This rendering should occur during :meth:`step` and :meth:`render` doesn't need to be called. Returns ``None``.
 								        - "rgb_array": Return a single frame representing the current state of the environment.
 								          A frame is a ``np.ndarray`` with shape ``(x, y, 3)`` representing RGB values for an x-by-y pixel image.
 								        - "ansi": Return a string (``str``) or ``StringIO.StringIO`` containing a terminal-style text representation
 								          for each time step. The text can include newlines and ANSI escape sequences (e.g. for colors).
 								        - "rgb_array_list" and "ansi_list": List based version of render modes are possible (except Human) through the
 								          wrapper, :py:class:`gymnasium.wrappers.RenderCollection` that is automatically applied during ``gymnasium.make(..., render_mode="rgb_array_list")``.
 								          The frames collected are popped after :meth:`render` is called or :meth:`reset`.
-												Initial release. Hello world :).

											
										
										
											2016-04-27 08:00:58 -07:00
 								        Note:
-												Updates the Env, Wrapper and Vector API documentation (#48)


											
										
										
											2022-10-12 15:58:01 +01:00
+								            Make sure that your class's :attr:`metadata` ``"render_modes"`` key includes the list of supported modes.
 								        .. versionchanged:: 0.25.0
 								            The render function was changed to no longer accept parameters, rather these parameters should be specified
 								            when the environment is initialised, i.e., ``gymnasium.make("CartPole-v1", render_mode="human")``
-												Initial release. Hello world :).

											
										
										
											2016-04-27 08:00:58 -07:00
+								        """
-												Cleanup, removal of unmaintained code (#836)

* add dtype to Box

* remove board_game, debugging, safety, parameter_tuning environments

* massive set of breaking changes
- remove python logging module
- _step, _reset, _seed, _close => non underscored method
- remove benchmark and scoring folder

* Improve render("human"), now resizable, closable window.

* get rid of default step and reset in wrappers, so it doesn’t silently fail for people with underscore methods

* CubeCrash unit test environment

* followup fixes

* MemorizeDigits unit test environment

* refactored spaces a bit
fixed indentation
disabled test_env_semantics

* fix unit tests

* fixes

* CubeCrash, MemorizeDigits tested

* gym backwards compatibility patch

* gym backwards compatibility, followup fixes

* changelist, add spaces to main namespaces

* undo_logger_setup for backwards compat

* remove configuration.py

											
										
										
											2018-01-25 18:20:14 -08:00
+								        raise NotImplementedError
-												Initial release. Hello world :).

											
										
										
											2016-04-27 08:00:58 -07:00
-												Add close() to Env, add functionality to call close() on exit

											
										
										
											2016-05-15 15:59:02 -07:00
+								    def close(self):
-												Updates the Env, Wrapper and Vector API documentation (#48)


											
										
										
											2022-10-12 15:58:01 +01:00
+								        """After the user has finished using the environment, close contains the code necessary to "clean up" the environment.
 								        This is critical for closing rendering windows, database or HTTP connections.
 								        """
-												[Update core.py] Remove underscore methods and its deprecation warning (#1320)

* Update core.py

* Update core.py

* Update core.py

* Update core.py

* Update core.py

* Update core.py

											
										
										
											2019-05-03 23:53:31 +02:00
+								        pass
-												Add close() to Env, add functionality to call close() on exit

											
										
										
											2016-05-15 15:59:02 -07:00
-												Don't have envs be aware of wrappers (#296)

You can always achieve the same effect by exposing a wrapping function:

def MyEnv():
  return MyWrapper(MyUnwrappedEnv())
											
										
										
											2016-08-17 15:16:45 -07:00
+								    @property
-												Update the type hinting for core.py (#39)


											
										
										
											2022-11-12 10:21:24 +00:00
+								    def unwrapped(self) -> Env[ObsType, ActType]:
 								        """Returns the base non-wrapped environment.
-												Add experimental Wrapper (#276)


											
										
										
											2016-08-11 14:45:52 -07:00
 								        Returns:
-												Updates the Env, Wrapper and Vector API documentation (#48)


											
										
										
											2022-10-12 15:58:01 +01:00
+								            Env: The base non-wrapped :class:`gymnasium.Env` instance
-												Add experimental Wrapper (#276)


											
										
										
											2016-08-11 14:45:52 -07:00
+								        """
-												remove configure, simplify core.py

											
										
										
											2017-02-26 00:01:00 -08:00
+								        return self
-												Add experimental Wrapper (#276)


											
										
										
											2016-08-11 14:45:52 -07:00
-												Updates the Env, Wrapper and Vector API documentation (#48)


											
										
										
											2022-10-12 15:58:01 +01:00
+								    @property
 								    def np_random(self) -> np.random.Generator:
 								        """Returns the environment's internal :attr:`_np_random` that if not set will initialise with a random seed.
 								        Returns:
 								            Instances of `np.random.Generator`
 								        """
 								        if self._np_random is None:
 								            self._np_random, seed = seeding.np_random()
 								        return self._np_random
 								    @np_random.setter
 								    def np_random(self, value: np.random.Generator):
 								        self._np_random = value
-												Initial release. Hello world :).

											
										
										
											2016-04-27 08:00:58 -07:00
+								    def __str__(self):
-												Updates the Env, Wrapper and Vector API documentation (#48)


											
										
										
											2022-10-12 15:58:01 +01:00
+								        """Returns a string of the environment with the :attr:`spec` id if :attr:`spec` is not ``None``.
 								        Returns:
 								            A string identifying the environment
 								        """
-												Make sure env.spec always exists and is valid. (#621)

* Make sure env.spec always exists and is valid. Previously there was an error when you tried to get the string representation of an unregistered env.

* update changelist

											
										
										
											2017-06-16 16:35:03 -07:00
+								        if self.spec is None:
-												Py36+ syntax in gym/*.py: derived by running `pyupgrade --py36-plus gym/*.py` and `flynt gym --ll 120` (#2473)

Co-authored-by: Ilya Kamen <ilya.kamenshchikov@bosch.com>
											
										
										
											2021-11-14 14:50:40 +01:00
+								            return f"<{type(self).__name__} instance>"
-												Make sure env.spec always exists and is valid. (#621)

* Make sure env.spec always exists and is valid. Previously there was an error when you tried to get the string representation of an unregistered env.

* update changelist

											
										
										
											2017-06-16 16:35:03 -07:00
+								        else:
-												Py36+ syntax in gym/*.py: derived by running `pyupgrade --py36-plus gym/*.py` and `flynt gym --ll 120` (#2473)

Co-authored-by: Ilya Kamen <ilya.kamenshchikov@bosch.com>
											
										
										
											2021-11-14 14:50:40 +01:00
+								            return f"<{type(self).__name__}<{self.spec.id}>>"
-												Initial release. Hello world :).

											
										
										
											2016-04-27 08:00:58 -07:00
-												Implement context handler protocol for Env (#1012)

This enables writing
```
import gym

with gym.make(...) as env:
    ...
```
without the need to remember to call `env.close()` later.
											
										
										
											2019-02-25 15:53:58 -08:00
+								    def __enter__(self):
-												Blacken the codebase (#2265)


											
										
										
											2021-07-29 02:26:34 +02:00
+								        """Support with-statement for the environment."""
-												Implement context handler protocol for Env (#1012)

This enables writing
```
import gym

with gym.make(...) as env:
    ...
```
without the need to remember to call `env.close()` later.
											
										
										
											2019-02-25 15:53:58 -08:00
+								        return self
-												Update the type hinting for core.py (#39)


											
										
										
											2022-11-12 10:21:24 +00:00
+								    def __exit__(self, *args: Any):
-												Updates the Env, Wrapper and Vector API documentation (#48)


											
										
										
											2022-10-12 15:58:01 +01:00
+								        """Support with-statement for the environment and closes the environment."""
-												Implement context handler protocol for Env (#1012)

This enables writing
```
import gym

with gym.make(...) as env:
    ...
```
without the need to remember to call `env.close()` later.
											
										
										
											2019-02-25 15:53:58 -08:00
+								        self.close()
 								        # propagate exception
 								        return False
-												New robotics environments (#912)


											
										
										
											2018-02-26 17:35:07 +01:00
-												Update the type hinting for core.py (#39)


											
										
										
											2022-11-12 10:21:24 +00:00
+								WrapperObsType = TypeVar("WrapperObsType")
 								WrapperActType = TypeVar("WrapperActType")
 								class Wrapper(Env[WrapperObsType, WrapperActType]):
-												Updates the Env, Wrapper and Vector API documentation (#48)


											
										
										
											2022-10-12 15:58:01 +01:00
+								    """Wraps a :class:`gymnasium.Env` to allow a modular transformation of the :meth:`step` and :meth:`reset` methods.
-												Updated Wrapper docs (#173)


											
										
										
											2022-12-03 13:46:11 +01:00
+								    This class is the base class of all wrappers to change the behavior of the underlying environment.
 								    Wrappers that inherit from this class can modify the :attr:`action_space`, :attr:`observation_space`,
 								    :attr:`reward_range` and :attr:`metadata` attributes, without changing the underlying environment's attributes.
 								    Moreover, the behavior of the :meth:`step` and :meth:`reset` methods can be changed by these wrappers.
-												Updates the Env, Wrapper and Vector API documentation (#48)


											
										
										
											2022-10-12 15:58:01 +01:00
-												Updated Wrapper docs (#173)


											
										
										
											2022-12-03 13:46:11 +01:00
+								    Some attributes (:attr:`spec`, :attr:`render_mode`, :attr:`np_random`) will point back to the wrapper's environment
 								    (i.e. to the corresponding attributes of :attr:`env`).
-												Feature/pixel observation wrapper (#1499)

* Implement PixelObservationWrapper

* Change MujocoEnv.render to support custom camera_{name,id}

* Implement tests for PixelObservationWrapper

* Use env.get_pixels instead of direct env.render

* Fix camera_{id,name} check in pixel observation wrapper

* Fix rendering with explicit camera_id

* Add Wrapperget_pixels to allow call to be propagated to wrapped env

* Remove use of unnecessary `get_pixels` method

* Update PixelObservationWrapper to support multiple pixel keys

* Remove unnecessary `rgb_rendering_tracking` argument

* Remove rgb_rendering_tracking logic

											
										
										
											2019-08-23 15:02:33 -07:00
-												Add Pydocstyle to CI (#2785)

* Added pydocstyle to pre-commit

* Added docstrings for tests and updated the tests for autoreset

* Add pydocstyle exclude folder to allow slowly adding new docstrings

* Add docstrings for setup.py and gym/__init__.py, core.py, error.py and logger.py

* Check that all unwrapped environment are of a particular wrapper type

* Reverted back to import gym.spaces.Space to gym.spaces

* Fixed the __init__.py docstring

* Fixed autoreset autoreset test

* Updated gym __init__.py top docstring

* Remove unnecessary import

* Removed "unused error" and make APIerror deprecated at gym 1.0

* Add pydocstyle description to CONTRIBUTING.md

* Added docstrings section to CONTRIBUTING.md

* Added :meth: and :attr: keywords to docstrings

* Added :meth: and :attr: keywords to docstrings

* Update the step docstring placing the return type in the as a note.

* Updated step return type to include each element

* Update maths notation to reward range

* Fixed infinity maths notation
											
										
										
											2022-05-10 15:35:45 +01:00
+								    Note:
-												Updated Wrapper docs (#173)


											
										
										
											2022-12-03 13:46:11 +01:00
+								        If you inherit from :class:`Wrapper`, don't forget to call ``super().__init__(env)``
-												[Update core.py] Remove underscore methods and its deprecation warning (#1320)

* Update core.py

* Update core.py

* Update core.py

* Update core.py

* Update core.py

* Update core.py

											
										
										
											2019-05-03 23:53:31 +02:00
+								    """
-												Blacken the codebase (#2265)


											
										
										
											2021-07-29 02:26:34 +02:00
-												Update the type hinting for core.py (#39)


											
										
										
											2022-11-12 10:21:24 +00:00
+								    def __init__(self, env: Env[ObsType, ActType]):
-												Add Pydocstyle to CI (#2785)

* Added pydocstyle to pre-commit

* Added docstrings for tests and updated the tests for autoreset

* Add pydocstyle exclude folder to allow slowly adding new docstrings

* Add docstrings for setup.py and gym/__init__.py, core.py, error.py and logger.py

* Check that all unwrapped environment are of a particular wrapper type

* Reverted back to import gym.spaces.Space to gym.spaces

* Fixed the __init__.py docstring

* Fixed autoreset autoreset test

* Updated gym __init__.py top docstring

* Remove unnecessary import

* Removed "unused error" and make APIerror deprecated at gym 1.0

* Add pydocstyle description to CONTRIBUTING.md

* Added docstrings section to CONTRIBUTING.md

* Added :meth: and :attr: keywords to docstrings

* Added :meth: and :attr: keywords to docstrings

* Update the step docstring placing the return type in the as a note.

* Updated step return type to include each element

* Update maths notation to reward range

* Fixed infinity maths notation
											
										
										
											2022-05-10 15:35:45 +01:00
+								        """Wraps an environment to allow a modular transformation of the :meth:`step` and :meth:`reset` methods.
 								        Args:
 								            env: The environment to wrap
 								        """
-												Tweak Wrapper implementation (#291)

* Tweak README and don't use __new__ for wrapper

The extra 'env' argument means that Wrapper authors with a custom
__init__ need to think about the parent signature anyway, so there's
not as much benefit to adding the more surprising __new__.

* Add support for registering wrappers for the official environment

											
										
										
											2016-08-13 19:24:48 -07:00
+								        self.env = env
-												Forward environment properties to the wrapper (#2373)

* Forward environment properties to the wrapper, fixes #2175

* Add tests for property forwarding in Wrapper

* Rename klass to class_ in test_core
											
										
										
											2021-09-17 18:02:59 -04:00
-												Update the type hinting for core.py (#39)


											
										
										
											2022-11-12 10:21:24 +00:00
+								        self._action_space: spaces.Space[WrapperActType] | None = None
 								        self._observation_space: spaces.Space[WrapperObsType] | None = None
 								        self._reward_range: tuple[SupportsFloat, SupportsFloat] | None = None
 								        self._metadata: dict[str, Any] | None = None
-												Add Monitored wrapper (#434)

* Add WIP Monitored wrapper

* Remove irrelevant render after close monitor test

* py27 compatibility

* Fix test_benchmark

* Move Monitored out of wrappers __init__

* Turn Monitored into a function that returns a Monitor class

* Fix monitor tests

* Remove deprecated test

* Remove deprecated utility

* Prevent duplicate wrapping, add test

* Fix test

* close env in tests to prevent writing to nonexistent file

* Disable semisuper tests

* typo

* Fix failing spec

* Fix monitoring on semisuper tasks

* Allow disabling of duplicate check

* Rename MonitorManager

* Monitored -> Monitor

* Clean up comments

* Remove cruft

											
										
										
											2016-12-23 16:21:42 -08:00
-												Update the type hinting for core.py (#39)


											
										
										
											2022-11-12 10:21:24 +00:00
+								    def __getattr__(self, name: str):
-												Add Pydocstyle to CI (#2785)

* Added pydocstyle to pre-commit

* Added docstrings for tests and updated the tests for autoreset

* Add pydocstyle exclude folder to allow slowly adding new docstrings

* Add docstrings for setup.py and gym/__init__.py, core.py, error.py and logger.py

* Check that all unwrapped environment are of a particular wrapper type

* Reverted back to import gym.spaces.Space to gym.spaces

* Fixed the __init__.py docstring

* Fixed autoreset autoreset test

* Updated gym __init__.py top docstring

* Remove unnecessary import

* Removed "unused error" and make APIerror deprecated at gym 1.0

* Add pydocstyle description to CONTRIBUTING.md

* Added docstrings section to CONTRIBUTING.md

* Added :meth: and :attr: keywords to docstrings

* Added :meth: and :attr: keywords to docstrings

* Update the step docstring placing the return type in the as a note.

* Updated step return type to include each element

* Update maths notation to reward range

* Fixed infinity maths notation
											
										
										
											2022-05-10 15:35:45 +01:00
+								        """Returns an attribute with ``name``, unless ``name`` starts with an underscore."""
-												Update the type hinting for core.py (#39)


											
										
										
											2022-11-12 10:21:24 +00:00
+								        if name == "_np_random":
 								            raise AttributeError(
 								                "Can't access `_np_random` of a wrapper, use `self.unwrapped._np_random` or `self.np_random`."
 								            )
 								        elif name.startswith("_"):
-												make error message on accessing private attributes more representative (#2714)


											
										
										
											2022-03-24 19:10:06 +01:00
+								            raise AttributeError(f"accessing private attribute '{name}' is prohibited")
-												[Update core.py]: support Wrapper for registering global methods with nested wrapping (#1347)

* Update core.py

* Update core.py

											
										
										
											2019-03-25 20:11:53 +01:00
+								        return getattr(self.env, name)
-												add spec property to wrapper to be forwarded to wrapped env. Fixes 1554 (#1574)


											
										
										
											2019-06-28 15:27:43 -07:00
+								    @property
-												Update the type hinting for core.py (#39)


											
										
										
											2022-11-12 10:21:24 +00:00
+								    def spec(self) -> EnvSpec | None:
-												Updates the Env, Wrapper and Vector API documentation (#48)


											
										
										
											2022-10-12 15:58:01 +01:00
+								        """Returns the :attr:`Env` :attr:`spec` attribute."""
-												add spec property to wrapper to be forwarded to wrapped env. Fixes 1554 (#1574)


											
										
										
											2019-06-28 15:27:43 -07:00
+								        return self.env.spec
-												Add Monitored wrapper (#434)

* Add WIP Monitored wrapper

* Remove irrelevant render after close monitor test

* py27 compatibility

* Fix test_benchmark

* Move Monitored out of wrappers __init__

* Turn Monitored into a function that returns a Monitor class

* Fix monitor tests

* Remove deprecated test

* Remove deprecated utility

* Prevent duplicate wrapping, add test

* Fix test

* close env in tests to prevent writing to nonexistent file

* Disable semisuper tests

* typo

* Fix failing spec

* Fix monitoring on semisuper tasks

* Allow disabling of duplicate check

* Rename MonitorManager

* Monitored -> Monitor

* Clean up comments

* Remove cruft

											
										
										
											2016-12-23 16:21:42 -08:00
+								    @classmethod
-												Update the type hinting for core.py (#39)


											
										
										
											2022-11-12 10:21:24 +00:00
+								    def class_name(cls) -> str:
-												Add Pydocstyle to CI (#2785)

* Added pydocstyle to pre-commit

* Added docstrings for tests and updated the tests for autoreset

* Add pydocstyle exclude folder to allow slowly adding new docstrings

* Add docstrings for setup.py and gym/__init__.py, core.py, error.py and logger.py

* Check that all unwrapped environment are of a particular wrapper type

* Reverted back to import gym.spaces.Space to gym.spaces

* Fixed the __init__.py docstring

* Fixed autoreset autoreset test

* Updated gym __init__.py top docstring

* Remove unnecessary import

* Removed "unused error" and make APIerror deprecated at gym 1.0

* Add pydocstyle description to CONTRIBUTING.md

* Added docstrings section to CONTRIBUTING.md

* Added :meth: and :attr: keywords to docstrings

* Added :meth: and :attr: keywords to docstrings

* Update the step docstring placing the return type in the as a note.

* Updated step return type to include each element

* Update maths notation to reward range

* Fixed infinity maths notation
											
										
										
											2022-05-10 15:35:45 +01:00
+								        """Returns the class name of the wrapper."""
-												Add Monitored wrapper (#434)

* Add WIP Monitored wrapper

* Remove irrelevant render after close monitor test

* py27 compatibility

* Fix test_benchmark

* Move Monitored out of wrappers __init__

* Turn Monitored into a function that returns a Monitor class

* Fix monitor tests

* Remove deprecated test

* Remove deprecated utility

* Prevent duplicate wrapping, add test

* Fix test

* close env in tests to prevent writing to nonexistent file

* Disable semisuper tests

* typo

* Fix failing spec

* Fix monitoring on semisuper tasks

* Allow disabling of duplicate check

* Rename MonitorManager

* Monitored -> Monitor

* Clean up comments

* Remove cruft

											
										
										
											2016-12-23 16:21:42 -08:00
+								        return cls.__name__
-												Forward environment properties to the wrapper (#2373)

* Forward environment properties to the wrapper, fixes #2175

* Add tests for property forwarding in Wrapper

* Rename klass to class_ in test_core
											
										
										
											2021-09-17 18:02:59 -04:00
+								    @property
-												Update the type hinting for core.py (#39)


											
										
										
											2022-11-12 10:21:24 +00:00
+								    def action_space(
 								        self,
 								    ) -> spaces.Space[ActType] | spaces.Space[WrapperActType]:
-												Updates the Env, Wrapper and Vector API documentation (#48)


											
										
										
											2022-10-12 15:58:01 +01:00
+								        """Return the :attr:`Env` :attr:`action_space` unless overwritten then the wrapper :attr:`action_space` is used."""
-												Forward environment properties to the wrapper (#2373)

* Forward environment properties to the wrapper, fixes #2175

* Add tests for property forwarding in Wrapper

* Rename klass to class_ in test_core
											
										
										
											2021-09-17 18:02:59 -04:00
+								        if self._action_space is None:
 								            return self.env.action_space
 								        return self._action_space
 								    @action_space.setter
-												Update the type hinting for core.py (#39)


											
										
										
											2022-11-12 10:21:24 +00:00
+								    def action_space(self, space: spaces.Space[WrapperActType]):
-												Forward environment properties to the wrapper (#2373)

* Forward environment properties to the wrapper, fixes #2175

* Add tests for property forwarding in Wrapper

* Rename klass to class_ in test_core
											
										
										
											2021-09-17 18:02:59 -04:00
+								        self._action_space = space
 								    @property
-												Update the type hinting for core.py (#39)


											
										
										
											2022-11-12 10:21:24 +00:00
+								    def observation_space(
 								        self,
 								    ) -> spaces.Space[ObsType] | spaces.Space[WrapperObsType]:
-												Updates the Env, Wrapper and Vector API documentation (#48)


											
										
										
											2022-10-12 15:58:01 +01:00
+								        """Return the :attr:`Env` :attr:`observation_space` unless overwritten then the wrapper :attr:`observation_space` is used."""
-												Forward environment properties to the wrapper (#2373)

* Forward environment properties to the wrapper, fixes #2175

* Add tests for property forwarding in Wrapper

* Rename klass to class_ in test_core
											
										
										
											2021-09-17 18:02:59 -04:00
+								        if self._observation_space is None:
 								            return self.env.observation_space
 								        return self._observation_space
 								    @observation_space.setter
-												Update the type hinting for core.py (#39)


											
										
										
											2022-11-12 10:21:24 +00:00
+								    def observation_space(self, space: spaces.Space[WrapperObsType]):
-												Forward environment properties to the wrapper (#2373)

* Forward environment properties to the wrapper, fixes #2175

* Add tests for property forwarding in Wrapper

* Rename klass to class_ in test_core
											
										
										
											2021-09-17 18:02:59 -04:00
+								        self._observation_space = space
 								    @property
-												Update the type hinting for core.py (#39)


											
										
										
											2022-11-12 10:21:24 +00:00
+								    def reward_range(self) -> tuple[SupportsFloat, SupportsFloat]:
-												Updates the Env, Wrapper and Vector API documentation (#48)


											
										
										
											2022-10-12 15:58:01 +01:00
+								        """Return the :attr:`Env` :attr:`reward_range` unless overwritten then the wrapper :attr:`reward_range` is used."""
-												Forward environment properties to the wrapper (#2373)

* Forward environment properties to the wrapper, fixes #2175

* Add tests for property forwarding in Wrapper

* Rename klass to class_ in test_core
											
										
										
											2021-09-17 18:02:59 -04:00
+								        if self._reward_range is None:
 								            return self.env.reward_range
 								        return self._reward_range
 								    @reward_range.setter
-												Update the type hinting for core.py (#39)


											
										
										
											2022-11-12 10:21:24 +00:00
+								    def reward_range(self, value: tuple[SupportsFloat, SupportsFloat]):
-												Forward environment properties to the wrapper (#2373)

* Forward environment properties to the wrapper, fixes #2175

* Add tests for property forwarding in Wrapper

* Rename klass to class_ in test_core
											
										
										
											2021-09-17 18:02:59 -04:00
+								        self._reward_range = value
 								    @property
-												Update the type hinting for core.py (#39)


											
										
										
											2022-11-12 10:21:24 +00:00
+								    def metadata(self) -> dict[str, Any]:
-												Updates the Env, Wrapper and Vector API documentation (#48)


											
										
										
											2022-10-12 15:58:01 +01:00
+								        """Returns the :attr:`Env` :attr:`metadata`."""
-												Forward environment properties to the wrapper (#2373)

* Forward environment properties to the wrapper, fixes #2175

* Add tests for property forwarding in Wrapper

* Rename klass to class_ in test_core
											
										
										
											2021-09-17 18:02:59 -04:00
+								        if self._metadata is None:
 								            return self.env.metadata
 								        return self._metadata
 								    @metadata.setter
-												Update the type hinting for core.py (#39)


											
										
										
											2022-11-12 10:21:24 +00:00
+								    def metadata(self, value: dict[str, Any]):
-												Forward environment properties to the wrapper (#2373)

* Forward environment properties to the wrapper, fixes #2175

* Add tests for property forwarding in Wrapper

* Rename klass to class_ in test_core
											
										
										
											2021-09-17 18:02:59 -04:00
+								        self._metadata = value
-												fix: add render_mode getter to Wrappers (#2884)


											
										
										
											2022-06-13 03:55:24 +02:00
+								    @property
-												Update the type hinting for core.py (#39)


											
										
										
											2022-11-12 10:21:24 +00:00
+								    def render_mode(self) -> str | None:
-												Updates the Env, Wrapper and Vector API documentation (#48)


											
										
										
											2022-10-12 15:58:01 +01:00
+								        """Returns the :attr:`Env` :attr:`render_mode`."""
-												fix: add render_mode getter to Wrappers (#2884)


											
										
										
											2022-06-13 03:55:24 +02:00
+								        return self.env.render_mode
-												Forwards all np_random assignments to the actual environment and prevent access to the `_np_random` in wrappers (#2857)


											
										
										
											2022-06-06 14:56:51 +01:00
+								    @property
-												removed inline RandomNumberGenerator implementation  (#3022)


											
										
										
											2022-08-22 09:20:28 -04:00
+								    def np_random(self) -> np.random.Generator:
-												Updates the Env, Wrapper and Vector API documentation (#48)


											
										
										
											2022-10-12 15:58:01 +01:00
+								        """Returns the :attr:`Env` :attr:`np_random` attribute."""
-												Forwards all np_random assignments to the actual environment and prevent access to the `_np_random` in wrappers (#2857)


											
										
										
											2022-06-06 14:56:51 +01:00
+								        return self.env.np_random
 								    @np_random.setter
-												Update the type hinting for core.py (#39)


											
										
										
											2022-11-12 10:21:24 +00:00
+								    def np_random(self, value: np.random.Generator):
-												Forwards all np_random assignments to the actual environment and prevent access to the `_np_random` in wrappers (#2857)


											
										
										
											2022-06-06 14:56:51 +01:00
+								        self.env.np_random = value
 								    @property
 								    def _np_random(self):
-												Update the type hinting for core.py (#39)


											
										
										
											2022-11-12 10:21:24 +00:00
+								        """This code will never be run due to __getattr__ being called prior this.
 								        It seems that @property overwrites the variable (`_np_random`) meaning that __getattr__ gets called with the missing variable.
 								        """
-												Forwards all np_random assignments to the actual environment and prevent access to the `_np_random` in wrappers (#2857)


											
										
										
											2022-06-06 14:56:51 +01:00
+								        raise AttributeError(
 								            "Can't access `_np_random` of a wrapper, use `.unwrapped._np_random` or `.np_random`."
 								        )
-												Update the type hinting for core.py (#39)


											
										
										
											2022-11-12 10:21:24 +00:00
+								    def step(
 								        self, action: WrapperActType
 								    ) -> tuple[WrapperObsType, SupportsFloat, bool, bool, dict]:
-												Updates the Env, Wrapper and Vector API documentation (#48)


											
										
										
											2022-10-12 15:58:01 +01:00
+								        """Uses the :meth:`step` of the :attr:`env` that can be overwritten to change the returned data."""
-												Support only new step API (while retaining compatibility functions)  (#3019)


											
										
										
											2022-08-30 19:41:59 +05:30
+								        return self.env.step(action)
-												Cleanup, removal of unmaintained code (#836)

* add dtype to Box

* remove board_game, debugging, safety, parameter_tuning environments

* massive set of breaking changes
- remove python logging module
- _step, _reset, _seed, _close => non underscored method
- remove benchmark and scoring folder

* Improve render("human"), now resizable, closable window.

* get rid of default step and reset in wrappers, so it doesn’t silently fail for people with underscore methods

* CubeCrash unit test environment

* followup fixes

* MemorizeDigits unit test envrionment

* refactored spaces a bit
fixed indentation
disabled test_env_semantics

* fix unit tests

* fixes

* CubeCrash, MemorizeDigits tested

* gym backwards compatibility patch

* gym backwards compatibility, followup fixes

* changelist, add spaces to main namespaces

* undo_logger_setup for backwards compat

* remove configuration.py

											
										
										
											2018-01-25 18:20:14 -08:00
-												Update the type hinting for core.py (#39)


											
										
										
											2022-11-12 10:21:24 +00:00
+								    def reset(
 								        self, *, seed: int | None = None, options: dict[str, Any] | None = None
 								    ) -> tuple[WrapperObsType, dict[str, Any]]:
-												Updates the Env, Wrapper and Vector API documentation (#48)


											
										
										
											2022-10-12 15:58:01 +01:00
+								        """Uses the :meth:`reset` of the :attr:`env` that can be overwritten to change the returned data."""
-												Update the type hinting for core.py (#39)


											
										
										
											2022-11-12 10:21:24 +00:00
+								        return self.env.reset(seed=seed, options=options)
-												Add experimental Wrapper (#276)


											
										
										
											2016-08-11 14:45:52 -07:00
-												Update the type hinting for core.py (#39)


											
										
										
											2022-11-12 10:21:24 +00:00
+								    def render(self) -> RenderFrame | list[RenderFrame] | None:
-												Updates the Env, Wrapper and Vector API documentation (#48)


											
										
										
											2022-10-12 15:58:01 +01:00
+								        """Uses the :meth:`render` of the :attr:`env` that can be overwritten to change the returned data."""
-												Update the type hinting for core.py (#39)


											
										
										
											2022-11-12 10:21:24 +00:00
+								        return self.env.render()
-												Add experimental Wrapper (#276)


											
										
										
											2016-08-11 14:45:52 -07:00
-												Cleanup, removal of unmaintained code (#836)

* add dtype to Box

* remove board_game, debugging, safety, parameter_tuning environments

* massive set of breaking changes
- remove python logging module
- _step, _reset, _seed, _close => non underscored method
- remove benchmark and scoring folder

* Improve render("human"), now resizable, closable window.

* get rid of default step and reset in wrappers, so it doesn’t silently fail for people with underscore methods

* CubeCrash unit test environment

* followup fixes

* MemorizeDigits unit test envrionment

* refactored spaces a bit
fixed indentation
disabled test_env_semantics

* fix unit tests

* fixes

* CubeCrash, MemorizeDigits tested

* gym backwards compatibility patch

* gym backwards compatibility, followup fixes

* changelist, add spaces to main namespaces

* undo_logger_setup for backwards compat

* remove configuration.py

											
										
										
											2018-01-25 18:20:14 -08:00
+								    def close(self):
-												Updates the Env, Wrapper and Vector API documentation (#48)


											
										
										
											2022-10-12 15:58:01 +01:00
+								        """Closes the wrapper and :attr:`env`."""
-												[Update core.py] Remove unnecessary parts (#1406)

* Update core.py

* Update core.py

											
										
										
											2019-03-25 18:23:14 +01:00
+								        return self.env.close()
-												Add experimental Wrapper (#276)


											
										
										
											2016-08-11 14:45:52 -07:00
 								    def __str__(self):
-												Updates the Env, Wrapper and Vector API documentation (#48)


											
										
										
											2022-10-12 15:58:01 +01:00
+								        """Returns the wrapper name and the :attr:`env` representation string."""
-												Py36+ syntax in gym/*.py: derived by running `pyupgrade --py36-plus gym/*.py` and `flynt gym --ll 120` (#2473)

Co-authored-by: Ilya Kamen <ilya.kamenshchikov@bosch.com>
											
										
										
											2021-11-14 14:50:40 +01:00
+								        return f"<{type(self).__name__}{self.env}>"
-												[WIP] Start adding Filter API (#329)

Expand Wrapper API
											
										
										
											2016-09-04 00:38:03 -07:00
 								    def __repr__(self):
-												Add Pydocstyle to CI (#2785)

* Added pydocstyle to pre-commit

* Added docstrings for tests and updated the tests for autoreset

* Add pydocstyle exclude folder to allow slowly adding new docstrings

* Add docstrings for setup.py and gym/__init__.py, core.py, error.py and logger.py

* Check that all unwrapped environment are of a particular wrapper type

* Reverted back to import gym.spaces.Space to gym.spaces

* Fixed the __init__.py docstring

* Fixed autoreset autoreset test

* Updated gym __init__.py top docstring

* Remove unnecessary import

* Removed "unused error" and make APIerror deprecated at gym 1.0

* Add pydocstyle description to CONTRIBUTING.md

* Added docstrings section to CONTRIBUTING.md

* Added :meth: and :attr: keywords to docstrings

* Added :meth: and :attr: keywords to docstrings

* Update the step docstring placing the return type in the as a note.

* Updated step return type to include each element

* Update maths notation to reward range

* Fixed infinity maths notation
											
										
										
											2022-05-10 15:35:45 +01:00
+								        """Returns the string representation of the wrapper."""
-												[WIP] Start adding Filter API (#329)

Expand Wrapper API
											
										
										
											2016-09-04 00:38:03 -07:00
+								        return str(self)
-												Don't have envs be aware of wrappers (#296)

You can always achive the same effect by exposing a wrapping function:

def MyEnv():
  return MyWrapper(MyUnwrappedEnv())
											
										
										
											2016-08-17 15:16:45 -07:00
 								    @property
-												Update the type hinting for core.py (#39)


											
										
										
											2022-11-12 10:21:24 +00:00
+								    def unwrapped(self) -> Env[ObsType, ActType]:
-												Updated Wrapper docs (#173)


											
										
										
											2022-12-03 13:46:11 +01:00
+								        """Returns the base environment of the wrapper.
 								        This will be the bare :class:`gymnasium.Env` environment, underneath all layers of wrappers.
 								        """
-												remove configure, simplify core.py

											
										
										
											2017-02-26 00:01:00 -08:00
+								        return self.env.unwrapped
-												[WIP] Start adding Filter API (#329)

Expand Wrapper API
											
										
										
											2016-09-04 00:38:03 -07:00
-												Update the type hinting for core.py (#39)


											
										
										
											2022-11-12 10:21:24 +00:00
+								class ObservationWrapper(Wrapper[WrapperObsType, ActType]):
-												Pydocstyle wrappers docstrings  (#2787)


											
										
										
											2022-05-13 13:58:19 +01:00
+								    """Superclass of wrappers that can modify observations using :meth:`observation` for :meth:`reset` and :meth:`step`.
-												Updates the Env, Wrapper and Vector API documentation (#48)


											
										
										
											2022-10-12 15:58:01 +01:00
+								    If you would like to apply a function to only the observation before
-												Fix and Update Basic Usage's and Core page (#41)


											
										
										
											2022-10-10 14:19:17 +02:00
+								    passing it to the learning code, you can simply inherit from :class:`ObservationWrapper` and overwrite the method
-												Pydocstyle wrappers docstrings  (#2787)


											
										
										
											2022-05-13 13:58:19 +01:00
+								    :meth:`observation` to implement that transformation. The transformation defined in that method must be
-												Updates the Env, Wrapper and Vector API documentation (#48)


											
										
										
											2022-10-12 15:58:01 +01:00
+								    reflected by the :attr:`env` observation space. Otherwise, you need to specify the new observation space of the
 								    wrapper by setting :attr:`self.observation_space` in the :meth:`__init__` method of your wrapper.
-												Pydocstyle wrappers docstrings  (#2787)


											
										
										
											2022-05-13 13:58:19 +01:00
-												Control f chaneg of gym to gymnasium

											
										
										
											2022-09-08 10:58:14 +01:00
+								    Among others, Gymnasium provides the observation wrapper :class:`TimeAwareObservation`, which adds information about the
-												Pydocstyle wrappers docstrings  (#2787)


											
										
										
											2022-05-13 13:58:19 +01:00
+								    index of the timestep to the observation.
 								    """
-												Add Pydocstyle to CI (#2785)

* Added pydocstyle to pre-commit

* Added docstrings for tests and updated the tests for autoreset

* Add pydocstyle exclude folder to allow slowly adding new docstrings

* Add docstrings for setup.py and gym/__init__.py, core.py, error.py and logger.py

* Check that all unwrapped environment are of a particular wrapper type

* Reverted back to import gym.spaces.Space to gym.spaces

* Fixed the __init__.py docstring

* Fixed autoreset autoreset test

* Updated gym __init__.py top docstring

* Remove unnecessary import

* Removed "unused error" and make APIerror deprecated at gym 1.0

* Add pydocstyle description to CONTRIBUTING.md

* Added docstrings section to CONTRIBUTING.md

* Added :meth: and :attr: keywords to docstrings

* Added :meth: and :attr: keywords to docstrings

* Update the step docstring placing the return type in the as a note.

* Updated step return type to include each element

* Update maths notation to reward range

* Fixed infinity maths notation
											
										
										
											2022-05-10 15:35:45 +01:00
-												Update the type hinting for core.py (#39)


											
										
										
											2022-11-12 10:21:24 +00:00
+								    def __init__(self, env: Env[ObsType, ActType]):
 								        """Constructor for the observation wrapper."""
 								        super().__init__(env)
 								    def reset(
 								        self, *, seed: int | None = None, options: dict[str, Any] | None = None
 								    ) -> tuple[WrapperObsType, dict[str, Any]]:
-												Updates the Env, Wrapper and Vector API documentation (#48)


											
										
										
											2022-10-12 15:58:01 +01:00
+								        """Modifies the :attr:`env` after calling :meth:`reset`, returning a modified observation using :meth:`self.observation`."""
-												Update the type hinting for core.py (#39)


											
										
										
											2022-11-12 10:21:24 +00:00
+								        obs, info = self.env.reset(seed=seed, options=options)
-												Removing return_info argument to env.reset() and deprecated env.seed() function (reset now always returns info) (#2962)

* removed return_info, made info dict mandatory in reset

* tenatively removed deprecated seed api for environments

* added more info type checks to wrapper tests

* formatting/style compliance

* addressed some comments

* polish to address review

* fixed tests after merge, and added a test of the return_info deprecation assertion if found in reset signature

* some organization of env_checker tests, reverted a probably merge error

* added deprecation check for seed function in env

* updated docstring

* removed debug prints, tweaked test_check_seed_deprecation

* changed return_info deprecation check from assertion to warning

* fixes to vector envs, now  should be correctly structured

* added some explanation and typehints for mockup depcreated return info reset function

* re-removed seed function from vector envs

* added explanation to _reset_return_info_type and changed the return statement
											
										
										
											2022-08-23 11:09:54 -04:00
+								        return self.observation(obs), info
-												Cleanup, removal of unmaintained code (#836)

* add dtype to Box

* remove board_game, debugging, safety, parameter_tuning environments

* massive set of breaking changes
- remove python logging module
- _step, _reset, _seed, _close => non underscored method
- remove benchmark and scoring folder

* Improve render("human"), now resizable, closable window.

* get rid of default step and reset in wrappers, so it doesn’t silently fail for people with underscore methods

* CubeCrash unit test environment

* followup fixes

* MemorizeDigits unit test envrionment

* refactored spaces a bit
fixed indentation
disabled test_env_semantics

* fix unit tests

* fixes

* CubeCrash, MemorizeDigits tested

* gym backwards compatibility patch

* gym backwards compatibility, followup fixes

* changelist, add spaces to main namespaces

* undo_logger_setup for backwards compat

* remove configuration.py

											
										
										
											2018-01-25 18:20:14 -08:00
-												Update the type hinting for core.py (#39)


											
										
										
											2022-11-12 10:21:24 +00:00
+								    def step(
 								        self, action: ActType
 								    ) -> tuple[WrapperObsType, SupportsFloat, bool, bool, dict[str, Any]]:
-												Updates the Env, Wrapper and Vector API documentation (#48)


											
										
										
											2022-10-12 15:58:01 +01:00
+								        """Modifies the :attr:`env` after calling :meth:`step` using :meth:`self.observation` on the returned observations."""
-												Support only new step API (while retaining compatibility functions)  (#3019)


											
										
										
											2022-08-30 19:41:59 +05:30
+								        observation, reward, terminated, truncated, info = self.env.step(action)
 								        return self.observation(observation), reward, terminated, truncated, info
-												[Update core.py] Remove underscore methods and its deprecation warning (#1320)

* Update core.py

* Update core.py

* Update core.py

* Update core.py

* Update core.py

* Update core.py

											
										
										
											2019-05-03 23:53:31 +02:00
-												Update the type hinting for core.py (#39)


											
										
										
											2022-11-12 10:21:24 +00:00
+								    def observation(self, observation: ObsType) -> WrapperObsType:
-												Updates the Env, Wrapper and Vector API documentation (#48)


											
										
										
											2022-10-12 15:58:01 +01:00
+								        """Returns a modified observation.
 								        Args:
 								            observation: The :attr:`env` observation
 								        Returns:
 								            The modified observation
 								        """
-												[Update core.py] Remove underscore methods and its deprecation warning (#1320)

* Update core.py

* Update core.py

* Update core.py

* Update core.py

* Update core.py

* Update core.py

											
										
										
											2019-05-03 23:53:31 +02:00
+								        raise NotImplementedError
-												[WIP] Start adding Filter API (#329)

Expand Wrapper API
											
										
										
											2016-09-04 00:38:03 -07:00
-												Update the type hinting for core.py (#39)


											
										
										
											2022-11-12 10:21:24 +00:00
+								class RewardWrapper(Wrapper[ObsType, ActType]):
-												Pydocstyle wrappers docstrings  (#2787)


											
										
										
											2022-05-13 13:58:19 +01:00
+								    """Superclass of wrappers that can modify the returning reward from a step.
 								    If you would like to apply a function to the reward that is returned by the base environment before
 								    passing it to learning code, you can simply inherit from :class:`RewardWrapper` and overwrite the method
 								    :meth:`reward` to implement that transformation.
-												Updates the Env, Wrapper and Vector API documentation (#48)


											
										
										
											2022-10-12 15:58:01 +01:00
+								    This transformation might change the :attr:`reward_range`; to specify the :attr:`reward_range` of your wrapper,
-												Pydocstyle wrappers docstrings  (#2787)


											
										
										
											2022-05-13 13:58:19 +01:00
+								    you can simply define :attr:`self.reward_range` in :meth:`__init__`.
 								    """
-												Cleanup, removal of unmaintained code (#836)

* add dtype to Box

* remove board_game, debugging, safety, parameter_tuning environments

* massive set of breaking changes
- remove python logging module
- _step, _reset, _seed, _close => non underscored method
- remove benchmark and scoring folder

* Improve render("human"), now resizable, closable window.

* get rid of default step and reset in wrappers, so it doesn’t silently fail for people with underscore methods

* CubeCrash unit test environment

* followup fixes

* MemorizeDigits unit test envrionment

* refactored spaces a bit
fixed indentation
disabled test_env_semantics

* fix unit tests

* fixes

* CubeCrash, MemorizeDigits tested

* gym backwards compatibility patch

* gym backwards compatibility, followup fixes

* changelist, add spaces to main namespaces

* undo_logger_setup for backwards compat

* remove configuration.py

											
										
										
											2018-01-25 18:20:14 -08:00
-												Update the type hinting for core.py (#39)


											
										
										
											2022-11-12 10:21:24 +00:00
+								    def __init__(self, env: Env[ObsType, ActType]):
 								        """Constructor for the Reward wrapper."""
 								        super().__init__(env)
 								    def step(
 								        self, action: ActType
 								    ) -> tuple[ObsType, SupportsFloat, bool, bool, dict[str, Any]]:
-												Updates the Env, Wrapper and Vector API documentation (#48)


											
										
										
											2022-10-12 15:58:01 +01:00
+								        """Modifies the :attr:`env` :meth:`step` reward using :meth:`self.reward`."""
-												Support only new step API (while retaining compatibility functions)  (#3019)


											
										
										
											2022-08-30 19:41:59 +05:30
+								        observation, reward, terminated, truncated, info = self.env.step(action)
 								        return observation, self.reward(reward), terminated, truncated, info
-												Add non-underscore methods for Wrappers

											
										
										
											2016-09-04 01:44:20 -07:00
-												Update the type hinting for core.py (#39)


											
										
										
											2022-11-12 10:21:24 +00:00
+								    def reward(self, reward: SupportsFloat) -> SupportsFloat:
-												Updates the Env, Wrapper and Vector API documentation (#48)


											
										
										
											2022-10-12 15:58:01 +01:00
+								        """Returns a modified environment ``reward``.
 								        Args:
 								            reward: The :attr:`env` :meth:`step` reward
 								        Returns:
 								            The modified `reward`
 								        """
-												[Update core.py] Remove underscore methods and its deprecation warning (#1320)

* Update core.py

* Update core.py

* Update core.py

* Update core.py

* Update core.py

* Update core.py

											
										
										
											2019-05-03 23:53:31 +02:00
+								        raise NotImplementedError
-												[WIP] Start adding Filter API (#329)

Expand Wrapper API
											
										
										
											2016-09-04 00:38:03 -07:00
-												Update the type hinting for core.py (#39)


											
										
										
											2022-11-12 10:21:24 +00:00
+								class ActionWrapper(Wrapper[ObsType, WrapperActType]):
-												Pydocstyle wrappers docstrings  (#2787)


											
										
										
											2022-05-13 13:58:19 +01:00
+								    """Superclass of wrappers that can modify the action before :meth:`env.step`.
 								    If you would like to apply a function to the action before passing it to the base environment,
 								    you can simply inherit from :class:`ActionWrapper` and overwrite the method :meth:`action` to implement
 								    that transformation. The transformation defined in that method must take values in the base environment’s
 								    action space. However, its domain might differ from the original action space.
 								    In that case, you need to specify the new action space of the wrapper by setting :attr:`self.action_space` in
 								    the :meth:`__init__` method of your wrapper.
-												Updates the Env, Wrapper and Vector API documentation (#48)


											
										
										
											2022-10-12 15:58:01 +01:00
+								    Among others, Gymnasium provides the action wrappers :class:`ClipAction` and :class:`RescaleAction` for clipping and rescaling actions.
-												Pydocstyle wrappers docstrings  (#2787)


											
										
										
											2022-05-13 13:58:19 +01:00
+								    """
-												[Update core.py] Remove unnecessary parts (#1406)

* Update core.py

* Update core.py

											
										
										
											2019-03-25 18:23:14 +01:00
-												Update the type hinting for core.py (#39)


											
										
										
											2022-11-12 10:21:24 +00:00
+								    def __init__(self, env: Env[ObsType, ActType]):
 								        """Constructor for the action wrapper."""
 								        super().__init__(env)
 								    def step(
 								        self, action: WrapperActType
 								    ) -> tuple[ObsType, SupportsFloat, bool, bool, dict[str, Any]]:
-												Updates the Env, Wrapper and Vector API documentation (#48)


											
										
										
											2022-10-12 15:58:01 +01:00
+								        """Runs the :attr:`env` :meth:`env.step` using the modified ``action`` from :meth:`self.action`."""
-												[Update core.py] Remove underscore methods and its deprecation warning (#1320)

* Update core.py

* Update core.py

* Update core.py

* Update core.py

* Update core.py

* Update core.py

											
										
										
											2019-05-03 23:53:31 +02:00
+								        return self.env.step(self.action(action))
-												[WIP] Start adding Filter API (#329)

Expand Wrapper API
											
										
										
											2016-09-04 00:38:03 -07:00
-												Update the type hinting for core.py (#39)


											
										
										
											2022-11-12 10:21:24 +00:00
+								    def action(self, action: WrapperActType) -> ActType:
-												Updates the Env, Wrapper and Vector API documentation (#48)


											
										
										
											2022-10-12 15:58:01 +01:00
+								        """Returns a modified action before :meth:`env.step` is called.
-												Add non-underscore methods for Wrappers

											
										
										
											2016-09-04 01:44:20 -07:00
-												Updates the Env, Wrapper and Vector API documentation (#48)


											
										
										
											2022-10-12 15:58:01 +01:00
+								        Args:
 								            action: The original :meth:`step` actions
 								        Returns:
 								            The modified actions
 								        """
-												Blacken the codebase (#2265)


											
										
										
											2021-07-29 02:26:34 +02:00
+								        raise NotImplementedError