Gymnasium/gym/wrappers/step_api_compatibility.py

"""Implementation of StepAPICompatibility wrapper class for transforming envs between new and old step API."""
import gym
from gym.logger import deprecation
from gym.utils.step_api_compatibility import step_to_new_api, step_to_old_api


class StepAPICompatibility(gym.Wrapper):
    r"""Wrapper that converts an environment's ``step()`` output between the old and new step API.

    The two step API flavours differ in the tuple returned by ``step()``:

    * Old step API: ``(observation, reward, done, info)``
    * New step API: ``(observation, reward, terminated, truncated, info)``

    (Refer to docs for details on the API change)

    The wrapper exists to ease the transition to the new API and to keep backward compatibility.

    Args:
        env (gym.Env): the env to wrap. Can be in old or new API
        new_step_api (bool): True to have ``step()`` return the new step API format, False to have it
            return the old step API format. (False by default)

    Examples:
        >>> env = gym.make("CartPole-v1")
        >>> env # wrapper applied by default, set to old API
        <TimeLimit<OrderEnforcing<StepAPICompatibility<CartPoleEnv<CartPole-v1>>>>>
        >>> env = gym.make("CartPole-v1", new_step_api=True) # set to new API
        >>> env = StepAPICompatibility(CustomEnv(), new_step_api=True) # manually using wrapper on unregistered envs

    """

    def __init__(self, env: gym.Env, new_step_api=False):
        """Wrap ``env`` and record which step API format ``step()`` should emit.

        A deprecation message is logged when the old step API is selected.

        Args:
            env (gym.Env): the env to wrap. Can be in old or new API
            new_step_api (bool): Whether the wrapper's step method outputs two booleans (new API) or one boolean (old API)
        """
        super().__init__(env, new_step_api)
        self.new_step_api = new_step_api

        # Nudge callers that are still on the single-boolean format.
        old_api_notice = "Initializing environment in old step API which returns one bool instead of two. It is recommended to set `new_step_api=True` to use new step API. This will be the default behaviour in future."
        if not self.new_step_api:
            deprecation(old_api_notice)

    def step(self, action):
        """Step the wrapped environment and convert the result to the configured step API.

        Args:
            action: action to step through the environment with

        Returns:
            (observation, reward, terminated, truncated, info) when `new_step_api` is truthy,
            otherwise (observation, reward, done, info)
        """
        # Step first, then choose the converter matching the requested output format.
        raw_result = self.env.step(action)
        convert = step_to_new_api if self.new_step_api else step_to_old_api
        return convert(raw_result)
New Step API with terminated, truncated bools instead of done (#2752) 2022-07-10 02:18:06 +05:30			`"""Implementation of StepAPICompatibility wrapper class for transforming envs between new and old step API."""`
			`import gym`
			`from gym.logger import deprecation`
			`from gym.utils.step_api_compatibility import step_to_new_api, step_to_old_api`


			`class StepAPICompatibility(gym.Wrapper):`
			`r"""A wrapper which can transform an environment from new step API to old and vice-versa.`

			`Old step API refers to step() method returning (observation, reward, done, info)`
			`New step API refers to step() method returning (observation, reward, terminated, truncated, info)`
			`(Refer to docs for details on the API change)`

			`This wrapper is to be used to ease transition to new API and for backward compatibility.`

			`Args:`
			`env (gym.Env): the env to wrap. Can be in old or new API`
			`new_step_api (bool): True to use env with new step API, False to use env with old step API. (False by default)`

			`Examples:`
			`>>> env = gym.make("CartPole-v1")`
			`>>> env # wrapper applied by default, set to old API`
			`<TimeLimit<OrderEnforcing<StepAPICompatibility<CartPoleEnv<CartPole-v1>>>>>`
			`>>> env = gym.make("CartPole-v1", new_step_api=True) # set to new API`
			`>>> env = StepAPICompatibility(CustomEnv(), new_step_api=True) # manually using wrapper on unregistered envs`

			`"""`

			`def __init__(self, env: gym.Env, new_step_api=False):`
			`"""A wrapper which can transform an environment from new step API to old and vice-versa.`

			`Args:`
			`env (gym.Env): the env to wrap. Can be in old or new API`
			`new_step_api (bool): Whether the wrapper's step method outputs two booleans (new API) or one boolean (old API)`
			`"""`
			`super().__init__(env, new_step_api)`
			`self.new_step_api = new_step_api`
			`if not self.new_step_api:`
			`deprecation(`
Bug fix, add tests for environment checker and passive environment checker wrapper (#2903) 2022-07-11 02:45:24 +01:00			"Initializing environment in old step API which returns one bool instead of two. It is recommended to set `new_step_api=True` to use new step API. This will be the default behaviour in future."
New Step API with terminated, truncated bools instead of done (#2752) 2022-07-10 02:18:06 +05:30			`)`

			`def step(self, action):`
			"""Steps through the environment, returning 5 or 4 items depending on `new_step_api`.

			`Args:`
			`action: action to step through the environment with`

			`Returns:`
			`(observation, reward, terminated, truncated, info) or (observation, reward, done, info)`
			`"""`
			`step_returns = self.env.step(action)`
			`if self.new_step_api:`
			`return step_to_new_api(step_returns)`
			`else:`
			`return step_to_old_api(step_returns)`