# Gymnasium/tests/envs/test_envs.py

import pickle
import warnings

import pytest

import gymnasium as gym
from gymnasium.envs.registration import EnvSpec
from gymnasium.utils.env_checker import check_env, data_equivalence
from tests.envs.utils import (
    all_testing_env_specs,
    all_testing_initialised_envs,
    assert_equals,
)

# This runs a smoke test on each officially registered env. We may also want
# to try running environments that are not officially registered.
# Warning texts, each wrapped in the ANSI escape prefix "\x1b[33mWARN: " and the
# reset suffix "\x1b[0m".
# NOTE(review): presumably the allow-list for the passive env checker tests;
# it is not referenced in the visible part of this file - confirm the consumer.
PASSIVE_CHECK_IGNORE_WARNING = [
    "\x1b[33mWARN: " + expected_text + "\x1b[0m"
    for expected_text in (
        "This version of the mujoco environments depends on the mujoco-py bindings, which are no longer maintained and may stop working. Please upgrade to the v4 versions of the environments (which depend on the mujoco python bindings instead), unless you are trying to precisely replicate previous works).",
        "Initializing environment in done (old) step API which returns one bool instead of two.",
    )
]

# Warning texts that `test_envs_pass_env_checker` tolerates; any other recorded
# warning fails that test. Each entry is wrapped in the ANSI escape prefix
# "\x1b[33mWARN: " and the reset suffix "\x1b[0m" so it can be compared verbatim
# against the first argument of a recorded warning.
# NOTE(review): "maximum value is -infinity" reads like a typo, but the entry
# must match the emitted warning exactly - confirm against the env checker
# before changing it.
CHECK_ENV_IGNORE_WARNINGS = [
    "\x1b[33mWARN: " + expected_text + "\x1b[0m"
    for expected_text in (
        "This version of the mujoco environments depends on the mujoco-py bindings, which are no longer maintained and may stop working. Please upgrade to the v4 versions of the environments (which depend on the mujoco python bindings instead), unless you are trying to precisely replicate previous works).",
        "A Box observation space minimum value is -infinity. This is probably too low.",
        "A Box observation space maximum value is -infinity. This is probably too high.",
        "For Box action spaces, we recommend using a symmetric and normalized space (range=[-1, 1] or [0, 1]). See https://stable-baselines3.readthedocs.io/en/master/guide/rl_tips.html for more information.",
    )
]


@pytest.mark.parametrize(
    "spec",
    all_testing_env_specs,
    ids=[spec.id for spec in all_testing_env_specs],
)
def test_envs_pass_env_checker(spec):
    """Check that all environments pass the environment checker with no warnings other than the expected.

    The unwrapped environment built from ``spec`` is passed to ``check_env``
    (render checks skipped) while warnings are recorded. Afterwards every
    recorded warning whose first argument is not listed in
    ``CHECK_ENV_IGNORE_WARNINGS`` fails the test.

    Args:
        spec: The environment spec to instantiate and check.

    Raises:
        gym.error.Error: If a warning outside the allow-list was recorded.
    """
    with warnings.catch_warnings(record=True) as caught_warnings:
        env = spec.make(disable_env_checker=True).unwrapped
        try:
            check_env(env, skip_render_check=True)
        finally:
            # Close the environment even when the checker raises, so a failing
            # environment does not leak resources into the following tests.
            # Closing stays inside the recording context so that warnings
            # emitted by `close` are still captured.
            env.close()

    for warning in caught_warnings:
        if warning.message.args[0] not in CHECK_ENV_IGNORE_WARNINGS:
            raise gym.error.Error(f"Unexpected warning: {warning.message}")


# Note that this precludes running this test in multiple threads.
# However, we probably already can't do multithreading due to some environments.
# Seed passed to `reset` and to the action space in `test_env_determinism_rollout`.
SEED = 0
# Number of steps taken by each rollout in `test_env_determinism_rollout`.
NUM_STEPS = 50


@pytest.mark.parametrize(
    "env_spec",
    all_testing_env_specs,
    ids=[env.id for env in all_testing_env_specs],
)
def test_env_determinism_rollout(env_spec: EnvSpec):
    """Run a rollout with two environments and assert equality.

    This test runs a rollout of NUM_STEPS steps with two environments
    reset with the same seed and asserts that:

    - observations after the first reset are the same
    - observations are contained in the observation space
    - obs, rew, terminated, truncated and info are equal between the two envs

    Actions are sampled from the first environment's seeded action space and
    applied to both environments; the determinism of action sampling itself is
    not evaluated.

    Args:
        env_spec: The environment spec used to create both environments.
    """
    # Don't check rollout equality if it's a nondeterministic environment.
    if env_spec.nondeterministic is True:
        return

    env_1 = env_spec.make(disable_env_checker=True)
    env_2 = None
    try:
        env_2 = env_spec.make(disable_env_checker=True)

        # Only the initial observations are compared; the reset infos are not.
        initial_obs_1, _ = env_1.reset(seed=SEED)
        initial_obs_2, _ = env_2.reset(seed=SEED)
        assert_equals(initial_obs_1, initial_obs_2)

        env_1.action_space.seed(SEED)

        for time_step in range(NUM_STEPS):
            # We don't evaluate the determinism of actions
            action = env_1.action_space.sample()

            obs_1, rew_1, terminated_1, truncated_1, info_1 = env_1.step(action)
            obs_2, rew_2, terminated_2, truncated_2, info_2 = env_2.step(action)

            assert_equals(obs_1, obs_2, f"[{time_step}] ")
            assert env_1.observation_space.contains(
                obs_1
            )  # obs_2 verified by previous assertion

            assert rew_1 == rew_2, f"[{time_step}] reward 1={rew_1}, reward 2={rew_2}"
            assert (
                terminated_1 == terminated_2
            ), f"[{time_step}] terminated 1={terminated_1}, terminated 2={terminated_2}"
            assert (
                truncated_1 == truncated_2
            ), f"[{time_step}] truncated 1={truncated_1}, truncated 2={truncated_2}"
            assert_equals(info_1, info_2, f"[{time_step}] ")

            if (
                terminated_1 or truncated_1
            ):  # terminated_2, truncated_2 verified by previous assertion
                env_1.reset(seed=SEED)
                env_2.reset(seed=SEED)
    finally:
        # Always release both environments, including when an assertion fails
        # or the second environment could not be created.
        env_1.close()
        if env_2 is not None:
            env_2.close()


@pytest.mark.parametrize(
    "env",
    all_testing_initialised_envs,
    # Keep the ids aligned one-to-one with the environments: a `None` entry
    # makes pytest fall back to its auto-generated id, whereas filtering the
    # entry out would leave the id list shorter than the parameter list.
    ids=[
        env.spec.id if env.spec is not None else None
        for env in all_testing_initialised_envs
    ],
)
def test_pickle_env(env: gym.Env):
    """Check that an environment survives a pickle round trip.

    The environment is pickled and unpickled, then both the original and the
    copy are reset and stepped once with the same action sampled from the
    original's action space. Both environments are closed afterwards, even if
    one of these operations raises.

    Args:
        env: An already initialised environment to round-trip through pickle.
    """
    try:
        pickled_env = pickle.loads(pickle.dumps(env))
        try:
            # NOTE(review): the results of `data_equivalence` are discarded
            # and the resets are unseeded, so this only verifies that
            # reset/step run on both environments - confirm whether the
            # comparison is meant to be asserted.
            data_equivalence(env.reset(), pickled_env.reset())

            action = env.action_space.sample()
            data_equivalence(env.step(action), pickled_env.step(action))
        finally:
            pickled_env.close()
    finally:
        env.close()
Fix unpickling Box2D and MuJoCo envs (#3025) * Try to fix car racing unpickling * Fix EzPickle for BipedalWalker and LunarLander * Shamelessly steal the pickle-unpickle test from Mark, with slight modifications * CarRacing EzPickle fix * Mujoco ezpickle fix 2022-08-16 18:05:36 +02:00			`import pickle`
Reduce the number of unexpected warnings during testing (#3050) * Initial commit * Remove unnecessary `warnings.simplefilters` * Fix tests for new step API * Fix testing Co-authored-by: Markus28 <montcyril@gmail.com> 2022-08-30 19:47:26 +01:00			`import warnings`
Fix unpickling Box2D and MuJoCo envs (#3025) * Try to fix car racing unpickling * Fix EzPickle for BipedalWalker and LunarLander * Shamelessly steal the pickle-unpickle test from Mark, with slight modifications * CarRacing EzPickle fix * Mujoco ezpickle fix 2022-08-16 18:05:36 +02:00
Improve `pre-commit` workflow (#2602) * feat: add `isort` to `pre-commit` * ci: skip `__init__.py` file for `isort` * ci: make `isort` mandatory in lint pipeline * docs: add a section on Git hooks * ci: check isort diff * fix: isort from master branch * docs: add pre-commit badge * ci: update black + bandit versions * feat: add PR template * refactor: PR template * ci: remove bandit * docs: add Black badge * ci: try to remove all `\|\| true` statements * ci: remove lint_python job - Remove `lint_python` CI job - Move `pyupgrade` job to `pre-commit` workflow * fix: avoid messing with typing * docs: add a note on running `pre-cpmmit` manually * ci: apply `pre-commit` to the whole codebase 2022-03-31 12:50:38 -07:00			`import pytest`
Fix autodetect dtype warnings (#1234) * Fix autodetect dtype warnings * Use warnings module for gym logger * Fix warning in tests 2018-11-29 02:27:27 +01:00
Change import gymnasium to import gymnasium as gym (#20) 2022-09-16 23:41:27 +01:00			`import gymnasium as gym`
Rename to gymnasium 2022-09-08 10:10:07 +01:00			`from gymnasium.envs.registration import EnvSpec`
			`from gymnasium.utils.env_checker import check_env, data_equivalence`
Fix unpickling Box2D and MuJoCo envs (#3025) * Try to fix car racing unpickling * Fix EzPickle for BipedalWalker and LunarLander * Shamelessly steal the pickle-unpickle test from Mark, with slight modifications * CarRacing EzPickle fix * Mujoco ezpickle fix 2022-08-16 18:05:36 +02:00			`from tests.envs.utils import (`
			`all_testing_env_specs,`
			`all_testing_initialised_envs,`
			`assert_equals,`
			`)`
Blacken the codebase (#2265) 2021-07-29 02:26:34 +02:00
Add test skipping to determinism test, add seeding to debugging envs 2016-05-31 00:57:31 -07:00			`# This runs a smoketest on each official registered env. We may want`
Bug fix, add tests for environment checker and passive environment checker wrapper (#2903) 2022-07-11 02:45:24 +01:00			`# to try also running environments which are not officially registered envs.`
			`PASSIVE_CHECK_IGNORE_WARNING = [`
			`f"\x1b[33mWARN: {message}\x1b[0m"`
			`for message in [`
			`"This version of the mujoco environments depends on the mujoco-py bindings, which are no longer maintained and may stop working. Please upgrade to the v4 versions of the environments (which depend on the mujoco python bindings instead), unless you are trying to precisely replicate previous works).",`
Support only new step API (while retaining compatibility functions) (#3019) 2022-08-30 19:41:59 +05:30			`"Initializing environment in done (old) step API which returns one bool instead of two.",`
Bug fix, add tests for environment checker and passive environment checker wrapper (#2903) 2022-07-11 02:45:24 +01:00			`]`
			`]`

			`CHECK_ENV_IGNORE_WARNINGS = [`
			`f"\x1b[33mWARN: {message}\x1b[0m"`
			`for message in [`
			`"This version of the mujoco environments depends on the mujoco-py bindings, which are no longer maintained and may stop working. Please upgrade to the v4 versions of the environments (which depend on the mujoco python bindings instead), unless you are trying to precisely replicate previous works).",`
			`"A Box observation space minimum value is -infinity. This is probably too low.",`
			`"A Box observation space maximum value is -infinity. This is probably too high.",`
			`"For Box action spaces, we recommend using a symmetric and normalized space (range=[-1, 1] or [0, 1]). See https://stable-baselines3.readthedocs.io/en/master/guide/rl_tips.html for more information.",`
			`]`
			`]`
Rewrite env tests (#2867) 2022-06-16 14:29:13 +01:00

Add new MuJoCo bindings (#2762) 2022-05-24 08:47:51 -04:00			`@pytest.mark.parametrize(`
Added atari tests to CI, fixed test_gym_conversion that was failing due to missing ROMs (#87) 2022-11-01 12:55:38 +01:00			`"spec",`
			`all_testing_env_specs,`
			`ids=[spec.id for spec in all_testing_env_specs],`
Add new MuJoCo bindings (#2762) 2022-05-24 08:47:51 -04:00			`)`
Bug fix, add tests for environment checker and passive environment checker wrapper (#2903) 2022-07-11 02:45:24 +01:00			`def test_envs_pass_env_checker(spec):`
			`"""Check that all environments pass the environment checker with no warnings other than the expected."""`
Reduce the number of unexpected warnings during testing (#3050) * Initial commit * Remove unnecessary `warnings.simplefilters` * Fix tests for new step API * Fix testing Co-authored-by: Markus28 <montcyril@gmail.com> 2022-08-30 19:47:26 +01:00			`with warnings.catch_warnings(record=True) as caught_warnings:`
Bug fix, add tests for environment checker and passive environment checker wrapper (#2903) 2022-07-11 02:45:24 +01:00			`env = spec.make(disable_env_checker=True).unwrapped`
Test necessary imports (#146) 2022-12-01 12:18:01 +00:00			`check_env(env, skip_render_check=True)`
Initial release. Hello world :). 2016-04-27 08:00:58 -07:00
Bug fix, add tests for environment checker and passive environment checker wrapper (#2903) 2022-07-11 02:45:24 +01:00			`env.close()`

Reduce the number of unexpected warnings during testing (#3050) * Initial commit * Remove unnecessary `warnings.simplefilters` * Fix tests for new step API * Fix testing Co-authored-by: Markus28 <montcyril@gmail.com> 2022-08-30 19:47:26 +01:00			`for warning in caught_warnings:`
Bug fix, add tests for environment checker and passive environment checker wrapper (#2903) 2022-07-11 02:45:24 +01:00			`if warning.message.args[0] not in CHECK_ENV_IGNORE_WARNINGS:`
Change import gymnasium to import gymnasium as gym (#20) 2022-09-16 23:41:27 +01:00			`raise gym.error.Error(f"Unexpected warning: {warning.message}")`
Improve closer implementation and docstrings (#126) * Improve auto close implementation - Register all envs at initialization time, not just ones created via make - Simplify names and add more documentation on interface - Move closer instances into the relevant modules review-requested: @jietang * Close environments in the tests This isn't strictly needed, but means there are fewer Doom subprocesses hanging around while the tests run. * Use 4 space indent in comment * Improve docstrings in core * Don't pass through args to __new__ The __init__ method gets called once __new__ returns, so these arguments are either ignored (Python 2) or result in an error (Python 3). The __init__ method automatically gets called with the correct arguments. * Fixup comments 2016-05-27 12:16:35 -07:00
Blacken the codebase (#2265) 2021-07-29 02:26:34 +02:00
Rewrite env tests (#2867) 2022-06-16 14:29:13 +01:00			`# Note that this precludes running this test in multiple threads.`
			`# However, we probably already can't do multithreading due to some environments.`
			`SEED = 0`
			`NUM_STEPS = 50`
Adding return_info argument to reset to allow for optional info dict as a second return value (#2546) * initial draft of optional info dict in reset function, implemented for cartpole, tests seem to be passing * merged core.py * updated return type annotation for reset function in core.py * optional metadata with return_info from reset added for all first party environments, with corresponding tests. Incomplete implementation for wrappers and vector wrappers * removed Optional type for return_info arguments * added tests for return_info to normalize wrapper and sync_vector_env * autoformatted using black * added optional reset metadata tests to several wrappers * added return_info capability to async_vector_env.py and test to verify functionality * added optional return_info test for record_video.py * removed tests for mujoco environments * autoformatted * improved test coverage for optional reset return_info * re-removed unit test envs accidentally reintroduced in merge * removed unnecessary import * changes based on code-review * small fix to core wrapper typing and autoformatted record_epsisode_stats * small change to pass flake8 style 2022-02-06 17:28:27 -06:00

Rewrite env tests (#2867) 2022-06-16 14:29:13 +01:00			`@pytest.mark.parametrize(`
Added atari tests to CI, fixed test_gym_conversion that was failing due to missing ROMs (#87) 2022-11-01 12:55:38 +01:00			`"env_spec",`
			`all_testing_env_specs,`
			`ids=[env.id for env in all_testing_env_specs],`
Rewrite env tests (#2867) 2022-06-16 14:29:13 +01:00			`)`
			`def test_env_determinism_rollout(env_spec: EnvSpec):`
			`"""Run a rollout with two environments and assert equality.`

			`This test run a rollout of NUM_STEPS steps with two environments`
			`initialized with the same seed and assert that:`

			`- observation after first reset are the same`
			`- same actions are sampled by the two envs`
			`- observations are contained in the observation space`
			`- obs, rew, done and info are equals between the two envs`
			`"""`
			`# Don't check rollout equality if it's a nondeterministic environment.`
			`if env_spec.nondeterministic is True:`
			`return`

			`env_1 = env_spec.make(disable_env_checker=True)`
			`env_2 = env_spec.make(disable_env_checker=True)`

Removing return_info argument to env.reset() and deprecated env.seed() function (reset now always returns info) (#2962) * removed return_info, made info dict mandatory in reset * tenatively removed deprecated seed api for environments * added more info type checks to wrapper tests * formatting/style compliance * addressed some comments * polish to address review * fixed tests after merge, and added a test of the return_info deprecation assertion if found in reset signature * some organization of env_checker tests, reverted a probably merge error * added deprecation check for seed function in env * updated docstring * removed debug prints, tweaked test_check_seed_deprecation * changed return_info deprecation check from assertion to warning * fixes to vector envs, now should be correctly structured * added some explanation and typehints for mockup depcreated return info reset function * re-removed seed function from vector envs * added explanation to _reset_return_info_type and changed the return statement 2022-08-23 11:09:54 -04:00			`initial_obs_1, initial_info_1 = env_1.reset(seed=SEED)`
			`initial_obs_2, initial_info_2 = env_2.reset(seed=SEED)`
Rewrite env tests (#2867) 2022-06-16 14:29:13 +01:00			`assert_equals(initial_obs_1, initial_obs_2)`

			`env_1.action_space.seed(SEED)`

			`for time_step in range(NUM_STEPS):`
			`# We don't evaluate the determinism of actions`
			`action = env_1.action_space.sample()`

Support only new step API (while retaining compatibility functions) (#3019) 2022-08-30 19:41:59 +05:30			`obs_1, rew_1, terminated_1, truncated_1, info_1 = env_1.step(action)`
			`obs_2, rew_2, terminated_2, truncated_2, info_2 = env_2.step(action)`
Rewrite env tests (#2867) 2022-06-16 14:29:13 +01:00
			`assert_equals(obs_1, obs_2, f"[{time_step}] ")`
			`assert env_1.observation_space.contains(`
			`obs_1`
			`) # obs_2 verified by previous assertion`

			`assert rew_1 == rew_2, f"[{time_step}] reward 1={rew_1}, reward 2={rew_2}"`
Support only new step API (while retaining compatibility functions) (#3019) 2022-08-30 19:41:59 +05:30			`assert (`
			`terminated_1 == terminated_2`
			`), f"[{time_step}] done 1={terminated_1}, done 2={terminated_2}"`
			`assert (`
			`truncated_1 == truncated_2`
			`), f"[{time_step}] done 1={truncated_1}, done 2={truncated_2}"`
Rewrite env tests (#2867) 2022-06-16 14:29:13 +01:00			`assert_equals(info_1, info_2, f"[{time_step}] ")`

Support only new step API (while retaining compatibility functions) (#3019) 2022-08-30 19:41:59 +05:30			`if (`
			`terminated_1 or truncated_1`
			`): # terminated_2, truncated_2 verified by previous assertion`
Rewrite env tests (#2867) 2022-06-16 14:29:13 +01:00			`env_1.reset(seed=SEED)`
			`env_2.reset(seed=SEED)`

			`env_1.close()`
			`env_2.close()`
Adding return_info argument to reset to allow for optional info dict as a second return value (#2546) * initial draft of optional info dict in reset function, implemented for cartpole, tests seem to be passing * merged core.py * updated return type annotation for reset function in core.py * optional metadata with return_info from reset added for all first party environments, with corresponding tests. Incomplete implementation for wrappers and vector wrappers * removed Optional type for return_info arguments * added tests for return_info to normalize wrapper and sync_vector_env * autoformatted using black * added optional reset metadata tests to several wrappers * added return_info capability to async_vector_env.py and test to verify functionality * added optional return_info test for record_video.py * removed tests for mujoco environments * autoformatted * improved test coverage for optional reset return_info * re-removed unit test envs accidentally reintroduced in merge * removed unnecessary import * changes based on code-review * small fix to core wrapper typing and autoformatted record_epsisode_stats * small change to pass flake8 style 2022-02-06 17:28:27 -06:00

Fix unpickling Box2D and MuJoCo envs (#3025) * Try to fix car racing unpickling * Fix EzPickle for BipedalWalker and LunarLander * Shamelessly steal the pickle-unpickle test from Mark, with slight modifications * CarRacing EzPickle fix * Mujoco ezpickle fix 2022-08-16 18:05:36 +02:00			`@pytest.mark.parametrize(`
			`"env",`
			`all_testing_initialised_envs,`
Update the type hinting for core.py (#39) 2022-11-12 10:21:24 +00:00			`ids=[env.spec.id for env in all_testing_initialised_envs if env.spec is not None],`
Fix unpickling Box2D and MuJoCo envs (#3025) * Try to fix car racing unpickling * Fix EzPickle for BipedalWalker and LunarLander * Shamelessly steal the pickle-unpickle test from Mark, with slight modifications * CarRacing EzPickle fix * Mujoco ezpickle fix 2022-08-16 18:05:36 +02:00			`)`
Change import gymnasium to import gymnasium as gym (#20) 2022-09-16 23:41:27 +01:00			`def test_pickle_env(env: gym.Env):`
Fix unpickling Box2D and MuJoCo envs (#3025) * Try to fix car racing unpickling * Fix EzPickle for BipedalWalker and LunarLander * Shamelessly steal the pickle-unpickle test from Mark, with slight modifications * CarRacing EzPickle fix * Mujoco ezpickle fix 2022-08-16 18:05:36 +02:00			`pickled_env = pickle.loads(pickle.dumps(env))`

			`data_equivalence(env.reset(), pickled_env.reset())`

			`action = env.action_space.sample()`
			`data_equivalence(env.step(action), pickled_env.step(action))`
			`env.close()`
			`pickled_env.close()`