Gymnasium/gym/vector/tests/test_vector_env.py

import pytest
import numpy as np

from gym.vector.tests.utils import make_env

from gym.vector.async_vector_env import AsyncVectorEnv
from gym.vector.sync_vector_env import SyncVectorEnv

@pytest.mark.parametrize('shared_memory', [True, False])
def test_vector_env_equal(shared_memory):
    """Check that AsyncVectorEnv and SyncVectorEnv produce identical results.

    Both vectorized environments are built from the same four
    ``CubeCrash-v0`` factories and seeded with 0. The test then asserts that
    their spaces match, that ``reset`` returns equal observations, and that
    100 steps driven by the same sampled actions yield equal observations,
    rewards and done flags.

    Args:
        shared_memory: Forwarded to ``AsyncVectorEnv(shared_memory=...)``;
            the test is parametrized over ``True`` and ``False``.
    """
    env_fns = [make_env('CubeCrash-v0', i) for i in range(4)]
    num_steps = 100

    # Pre-bind both handles: if a constructor below raises, the cleanup in
    # ``finally`` must not fail on an unbound name and hide the real error.
    async_env = None
    sync_env = None
    try:
        async_env = AsyncVectorEnv(env_fns, shared_memory=shared_memory)
        sync_env = SyncVectorEnv(env_fns)

        async_env.seed(0)
        sync_env.seed(0)

        assert async_env.num_envs == sync_env.num_envs
        assert async_env.observation_space == sync_env.observation_space
        assert async_env.single_observation_space == sync_env.single_observation_space
        assert async_env.action_space == sync_env.action_space
        assert async_env.single_action_space == sync_env.single_action_space

        async_observations = async_env.reset()
        sync_observations = sync_env.reset()
        assert np.all(async_observations == sync_observations)

        for _ in range(num_steps):
            # The same batch of actions drives both environments.
            actions = async_env.action_space.sample()
            assert actions in sync_env.action_space

            async_observations, async_rewards, async_dones, _ = async_env.step(actions)
            sync_observations, sync_rewards, sync_dones, _ = sync_env.step(actions)

            assert np.all(async_observations == sync_observations)
            assert np.all(async_rewards == sync_rewards)
            assert np.all(async_dones == sync_dones)

    finally:
        # Nested so that sync_env is still closed when closing async_env
        # raises; each close is skipped if that env was never created.
        try:
            if async_env is not None:
                async_env.close()
        finally:
            if sync_env is not None:
                sync_env.close()
Vectorized environments (#1513)

* Initial version of vectorized environments
* Raise an exception in the main process if child process raises an exception
* Add list of exposed functions in vector module
* Use deepcopy instead of np.copy
* Add documentation for vector utils
* Add tests for copy in AsyncVectorEnv
* Add example in documentation for batch_space
* Add cloudpickle dependency in setup.py
* Fix __del__ in VectorEnv
* Check if all observation spaces are equal in AsyncVectorEnv
* Check if all observation spaces are equal in SyncVectorEnv
* Fix spaces non equality in SyncVectorEnv for Python 2
* Handle None parameter in create_empty_array
* Fix check_observation_space with spaces equality
* Raise an exception when operations are out of order in AsyncVectorEnv
* Add version requirement for cloudpickle
* Use a state instead of binary flags in AsyncVectorEnv
* Use numpy.zeros when initializing observations in vectorized environments
* Remove poll from public API in AsyncVectorEnv
* Remove close_extras from VectorEnv
* Add test between AsyncVectorEnv and SyncVectorEnv
* Remove close in check_observation_space
* Add documentation for seed and close
* Refactor exceptions for AsyncVectorEnv
* Close pipes if the environment raises an error
* Add tests for out of order operations
* Change default argument in create_empty_array to np.zeros
* Add get_attr and set_attr methods to VectorEnv
* Improve consistency in SyncVectorEnv

2019-06-21 17:29:44 -04:00

			`import pytest`
			`import numpy as np`

			`from gym.vector.tests.utils import make_env`

			`from gym.vector.async_vector_env import AsyncVectorEnv`
			`from gym.vector.sync_vector_env import SyncVectorEnv`

			`@pytest.mark.parametrize('shared_memory', [True, False])`
			`def test_vector_env_equal(shared_memory):`
			`env_fns = [make_env('CubeCrash-v0', i) for i in range(4)]`
			`num_steps = 100`
			`try:`
			`async_env = AsyncVectorEnv(env_fns, shared_memory=shared_memory)`
			`sync_env = SyncVectorEnv(env_fns)`

			`async_env.seed(0)`
			`sync_env.seed(0)`

			`assert async_env.num_envs == sync_env.num_envs`
			`assert async_env.observation_space == sync_env.observation_space`
			`assert async_env.single_observation_space == sync_env.single_observation_space`
			`assert async_env.action_space == sync_env.action_space`
			`assert async_env.single_action_space == sync_env.single_action_space`

			`async_observations = async_env.reset()`
			`sync_observations = sync_env.reset()`
			`assert np.all(async_observations == sync_observations)`

			`for _ in range(num_steps):`
			`actions = async_env.action_space.sample()`
			`assert actions in sync_env.action_space`

			`async_observations, async_rewards, async_dones, _ = async_env.step(actions)`
			`sync_observations, sync_rewards, sync_dones, _ = sync_env.step(actions)`

			`assert np.all(async_observations == sync_observations)`
			`assert np.all(async_rewards == sync_rewards)`
			`assert np.all(async_dones == sync_dones)`

			`finally:`
			`async_env.close()`
			`sync_env.close()`