Gymnasium/tests/wrappers/test_time_limit.py

import pytest

import gym
from gym.envs.classic_control.pendulum import PendulumEnv
from gym.wrappers import TimeLimit


def test_time_limit_reset_info():
    """Exercise the three ``reset`` call shapes through a ``TimeLimit`` wrapper.

    The test expects a bare observation from ``reset()`` and
    ``reset(return_info=False)``, and an ``(observation, info)`` pair from
    ``reset(return_info=True)`` where ``info`` is a dict.
    """
    wrapped = TimeLimit(gym.make("CartPole-v1"))
    space = wrapped.observation_space

    # Both the default call and an explicit return_info=False are expected
    # to hand back only the observation.
    for reset_kwargs in ({}, {"return_info": False}):
        observation = wrapped.reset(**reset_kwargs)
        assert space.contains(observation)

    # With return_info=True the result is unpacked as a two-element pair.
    observation, reset_info = wrapped.reset(return_info=True)
    assert space.contains(observation)
    assert isinstance(reset_info, dict)


@pytest.mark.parametrize("double_wrap", [False, True])
def test_time_limit_wrapper(double_wrap):
    """Check that ``TimeLimit`` ends the episode exactly at the step limit.

    The env is stepped with random actions until ``done`` is reported; the
    test then asserts that this happened after ``max_episode_length`` steps
    and that ``info["TimeLimit.truncated"]`` is ``True``.

    Args:
        double_wrap: When true, the env is wrapped in ``TimeLimit`` twice with
            the same limit, to check the outer wrapper leaves the flag intact.
    """
    # The pendulum env does not terminate by default
    # so we are sure termination is only due to timeout
    env = PendulumEnv()
    max_episode_length = 20
    env = TimeLimit(env, max_episode_length)
    if double_wrap:
        # TimeLimit wrapper should not overwrite
        # the TimeLimit.truncated key
        # if it was already set
        env = TimeLimit(env, max_episode_length)
    env.reset()
    done = False
    n_steps = 0
    info = {}
    # Bound the loop to one step past the limit: if the wrapper ever stops
    # signalling ``done``, the assertions below fail instead of the test
    # spinning forever and hanging the suite.
    while not done and n_steps <= max_episode_length:
        n_steps += 1
        _, _, done, info = env.step(env.action_space.sample())

    assert done, "TimeLimit did not end the episode at the step limit"
    assert n_steps == max_episode_length
    assert "TimeLimit.truncated" in info
    assert info["TimeLimit.truncated"] is True


@pytest.mark.parametrize("double_wrap", [False, True])
def test_termination_on_last_step(double_wrap):
    """Check the flag when the env itself finishes on the final allowed step.

    The underlying ``step`` is stubbed to always report ``done=True``, and the
    step limit is 1, so the env's own termination coincides with the limit.
    The test asserts that ``info["TimeLimit.truncated"]`` is present and
    ``False`` in that case.

    Args:
        double_wrap: When true, ``TimeLimit`` is applied twice with the same
            limit instead of once.
    """
    step_limit = 1
    env = PendulumEnv()

    # Stub out step: random observation, zero reward, done=True, empty info.
    # The lambda looks up ``env`` when called, just like a nested def would.
    env.step = lambda _action: (env.observation_space.sample(), 0.0, True, {})

    # One TimeLimit layer normally, two when double_wrap is set.
    for _ in range(2 if double_wrap else 1):
        env = TimeLimit(env, step_limit)

    env.reset()
    step_result = env.step(env.action_space.sample())
    done, info = step_result[2], step_result[3]

    assert done is True
    assert "TimeLimit.truncated" in info
    assert info["TimeLimit.truncated"] is False
Fix TimeLimit wrapper and add tests (#2888) * Fix TimeLimit wrapper and add tests * Slip test 2022-06-15 15:21:53 +02:00			`import pytest`

Adding return_info argument to reset to allow for optional info dict as a second return value (#2546) * initial draft of optional info dict in reset function, implemented for cartpole, tests seem to be passing * merged core.py * updated return type annotation for reset function in core.py * optional metadata with return_info from reset added for all first party environments, with corresponding tests. Incomplete implementation for wrappers and vector wrappers * removed Optional type for return_info arguments * added tests for return_info to normalize wrapper and sync_vector_env * autoformatted using black * added optional reset metadata tests to several wrappers * added return_info capability to async_vector_env.py and test to verify functionality * added optional return_info test for record_video.py * removed tests for mujoco environments * autoformatted * improved test coverage for optional reset return_info * re-removed unit test envs accidentally reintroduced in merge * removed unnecessary import * changes based on code-review * small fix to core wrapper typing and autoformatted record_epsisode_stats * small change to pass flake8 style 2022-02-06 17:28:27 -06:00			`import gym`
Fix TimeLimit wrapper and add tests (#2888) * Fix TimeLimit wrapper and add tests * Slip test 2022-06-15 15:21:53 +02:00			`from gym.envs.classic_control.pendulum import PendulumEnv`
Adding return_info argument to reset to allow for optional info dict as a second return value (#2546) * initial draft of optional info dict in reset function, implemented for cartpole, tests seem to be passing * merged core.py * updated return type annotation for reset function in core.py * optional metadata with return_info from reset added for all first party environments, with corresponding tests. Incomplete implementation for wrappers and vector wrappers * removed Optional type for return_info arguments * added tests for return_info to normalize wrapper and sync_vector_env * autoformatted using black * added optional reset metadata tests to several wrappers * added return_info capability to async_vector_env.py and test to verify functionality * added optional return_info test for record_video.py * removed tests for mujoco environments * autoformatted * improved test coverage for optional reset return_info * re-removed unit test envs accidentally reintroduced in merge * removed unnecessary import * changes based on code-review * small fix to core wrapper typing and autoformatted record_epsisode_stats * small change to pass flake8 style 2022-02-06 17:28:27 -06:00			`from gym.wrappers import TimeLimit`


			`def test_time_limit_reset_info():`
			`env = gym.make("CartPole-v1")`
			`env = TimeLimit(env)`
			`ob_space = env.observation_space`
			`obs = env.reset()`
			`assert ob_space.contains(obs)`
			`del obs`
			`obs = env.reset(return_info=False)`
			`assert ob_space.contains(obs)`
			`del obs`
			`obs, info = env.reset(return_info=True)`
			`assert ob_space.contains(obs)`
			`assert isinstance(info, dict)`
Fix TimeLimit wrapper and add tests (#2888) * Fix TimeLimit wrapper and add tests * Slip test 2022-06-15 15:21:53 +02:00

			`@pytest.mark.parametrize("double_wrap", [False, True])`
			`def test_time_limit_wrapper(double_wrap):`
			`# The pendulum env does not terminate by default`
			`# so we are sure termination is only due to timeout`
			`env = PendulumEnv()`
			`max_episode_length = 20`
			`env = TimeLimit(env, max_episode_length)`
			`if double_wrap:`
			`# TimeLimit wrapper should not overwrite`
			`# the TimeLimit.truncated key`
			`# if it was already set`
			`env = TimeLimit(env, max_episode_length)`
			`env.reset()`
			`done = False`
			`n_steps = 0`
			`info = {}`
			`while not done:`
			`n_steps += 1`
			`_, _, done, info = env.step(env.action_space.sample())`

			`assert n_steps == max_episode_length`
			`assert "TimeLimit.truncated" in info`
			`assert info["TimeLimit.truncated"] is True`


			`@pytest.mark.parametrize("double_wrap", [False, True])`
			`def test_termination_on_last_step(double_wrap):`
			`# Special case: termination at the last timestep`
			`# but not due to timeout`
			`env = PendulumEnv()`

			`def patched_step(_action):`
			`return env.observation_space.sample(), 0.0, True, {}`

			`env.step = patched_step`

			`max_episode_length = 1`
			`env = TimeLimit(env, max_episode_length)`
			`if double_wrap:`
			`env = TimeLimit(env, max_episode_length)`
			`env.reset()`
			`_, _, done, info = env.step(env.action_space.sample())`
			`assert done is True`
			`assert "TimeLimit.truncated" in info`
			`assert info["TimeLimit.truncated"] is False`