# Gymnasium/gym/envs/tests/test_envs_semantics.py

from __future__ import unicode_literals
import json
import hashlib
import os
import sys

from nose2 import tools
import logging
logger = logging.getLogger(__name__)

from gym import envs, spaces

from gym.envs.tests.test_envs import should_skip_env_spec_for_tests

# Directory holding this module; the rollout hashes file lives next to it.
DATA_DIR = os.path.dirname(__file__)
ROLLOUT_FILE = os.path.join(DATA_DIR, 'rollout.json')

# Total number of environment steps hashed per rollout. The episode count and
# the per-episode step count are both capped at the same value.
ROLLOUT_STEPS = 100
episodes = steps = ROLLOUT_STEPS

# Bootstrap an empty JSON object on first use so later reads of the rollout
# file always find something to parse.
if not os.path.isfile(ROLLOUT_FILE):
  with open(ROLLOUT_FILE, "w") as outfile:
    outfile.write(json.dumps({}, indent=2))

def hash_object(unhashed):
  """Return the SHA-256 hex digest of the UTF-16 encoding of `str(unhashed)`.

  The digest depends on the exact `str()` rendering of the argument, so any
  change to that rendering changes the hash.
  """
  text = str(unhashed)
  digest = hashlib.sha256()
  digest.update(text.encode('utf-16'))
  return digest.hexdigest()

def generate_rollout_hash(spec):
  """Roll out a seeded random policy and hash everything it produced.

  Seeds `spaces` and the environment with 0, then repeatedly samples actions
  from the environment's action space until ROLLOUT_STEPS steps have been
  taken in total. The environment is reset at the start of every episode, and
  an episode ends as soon as a step reports `done`.

  Args:
    spec: environment spec; only `spec.make()` is used here.

  Returns:
    A 4-tuple of hex digests `(observations, actions, rewards, dones)`, each
    the `hash_object` digest of the list of per-step values. The observation
    returned by `reset()` is not part of the hashed observations.
  """
  spaces.seed(0)
  env = spec.make()

  # Release the environment even when the rollout raises, so one failing spec
  # does not leak resources into the remaining parametrized runs.
  # Assumes the object returned by spec.make() exposes close(), as gym
  # environments do.
  try:
    env.seed(0)

    observation_list = []
    action_list = []
    reward_list = []
    done_list = []

    total_steps = 0
    for _ in range(episodes):
      if total_steps >= ROLLOUT_STEPS: break
      # The initial observation is intentionally not recorded: only values
      # returned by step() are hashed.
      env.reset()

      for _ in range(steps):
        action = env.action_space.sample()
        observation, reward, done, _info = env.step(action)

        action_list.append(action)
        observation_list.append(observation)
        reward_list.append(reward)
        done_list.append(done)

        total_steps += 1
        if total_steps >= ROLLOUT_STEPS: break

        if done: break

    # Hash before closing so the digests are computed while the environment
    # is still alive, exactly as the values were collected.
    observations_hash = hash_object(observation_list)
    actions_hash = hash_object(action_list)
    rewards_hash = hash_object(reward_list)
    dones_hash = hash_object(done_list)

    return observations_hash, actions_hash, rewards_hash, dones_hash
  finally:
    env.close()

# Every registered spec that has an entry point; each one becomes a test case.
specs = [spec for spec in envs.registry.all() if spec._entry_point is not None]
@tools.params(*specs)
def test_env_semantics(spec):
  """Check that a fresh seeded rollout still matches the stored hashes.

  Loads ROLLOUT_FILE, and if it has an entry for `spec.id`, regenerates the
  rollout hashes with `generate_rollout_hash` and asserts that observations,
  actions, rewards and dones all match the stored digests. Specs without a
  stored entry are not tested.

  Args:
    spec: environment spec supplied by the `tools.params` parametrization.
  """
  with open(ROLLOUT_FILE) as data_file:
    rollout_dict = json.load(data_file)

  if spec.id not in rollout_dict:
    # NOTE(review): this warns when the env is deterministic OR when it is a
    # spec that tests should skip. Warning only for deterministic, non-skipped
    # envs may have been the intent; confirm against generate_json.py.
    if not spec.nondeterministic or should_skip_env_spec_for_tests(spec):
      logger.warning("Rollout does not exist for %s, run generate_json.py to generate rollouts for new envs", spec.id)
    return

  logger.info("Testing rollout for %s environment...", spec.id)

  expected = rollout_dict[spec.id]
  observations_now, actions_now, rewards_now, dones_now = generate_rollout_hash(spec)

  assert expected['observations'] == observations_now, 'Observations not equal for {}'.format(spec.id)
  assert expected['actions'] == actions_now, 'Actions not equal for {}'.format(spec.id)
  assert expected['rewards'] == rewards_now, 'Rewards not equal for {}'.format(spec.id)
  assert expected['dones'] == dones_now, 'Dones not equal for {}'.format(spec.id)
Added test for environment semantics (#196) 2016-06-17 13:23:49 -07:00			`from __future__ import unicode_literals`
			`import json`
			`import hashlib`
			`import os`
			`import sys`

			`from nose2 import tools`
			`import logging`
			`logger = logging.getLogger(__name__)`

			`from gym import envs, spaces`

			`from gym.envs.tests.test_envs import should_skip_env_spec_for_tests`

			`DATA_DIR = os.path.dirname(__file__)`
			`ROLLOUT_STEPS = 100`
			`episodes = ROLLOUT_STEPS`
			`steps = ROLLOUT_STEPS`

Some tweaks to json rollout generation (#386) * Some tweaks to json rollout generation: - sort keys (to make diffs easier to read) - don't open and close json file so much - command line flag to allow overwriting hashes * Use a single rollout file, rather than one for each python version. 2016-10-21 19:00:36 -07:00			`ROLLOUT_FILE = os.path.join(DATA_DIR, 'rollout.json')`
Added test for environment semantics (#196) 2016-06-17 13:23:49 -07:00
			`if not os.path.isfile(ROLLOUT_FILE):`
			`with open(ROLLOUT_FILE, "w") as outfile:`
			`json.dump({}, outfile, indent=2)`

			`def hash_object(unhashed):`
			`return hashlib.sha256(str(unhashed).encode('utf-16')).hexdigest()`

			`def generate_rollout_hash(spec):`
			`spaces.seed(0)`
			`env = spec.make()`
			`env.seed(0)`

			`observation_list = []`
			`action_list = []`
			`reward_list = []`
			`done_list = []`

			`total_steps = 0`
			`for episode in range(episodes):`
			`if total_steps >= ROLLOUT_STEPS: break`
			`observation = env.reset()`

			`for step in range(steps):`
			`action = env.action_space.sample()`
			`observation, reward, done, _ = env.step(action)`

			`action_list.append(action)`
			`observation_list.append(observation)`
			`reward_list.append(reward)`
			`done_list.append(done)`

			`total_steps += 1`
			`if total_steps >= ROLLOUT_STEPS: break`

			`if done: break`

			`observations_hash = hash_object(observation_list)`
			`actions_hash = hash_object(action_list)`
			`rewards_hash = hash_object(reward_list)`
			`dones_hash = hash_object(done_list)`

			`return observations_hash, actions_hash, rewards_hash, dones_hash`

			`specs = [spec for spec in envs.registry.all() if spec._entry_point is not None]`
			`@tools.params(*specs)`
			`def test_env_semantics(spec):`
			`with open(ROLLOUT_FILE) as data_file:`
			`rollout_dict = json.load(data_file)`

			`if spec.id not in rollout_dict:`
			`if not spec.nondeterministic or should_skip_env_spec_for_tests(spec):`
			`logger.warn("Rollout does not exist for {}, run generate_json.py to generate rollouts for new envs".format(spec.id))`
			`return`

			`logger.info("Testing rollout for {} environment...".format(spec.id))`

			`observations_now, actions_now, rewards_now, dones_now = generate_rollout_hash(spec)`

			`assert rollout_dict[spec.id]['observations'] == observations_now, 'Observations not equal for {}'.format(spec.id)`
			`assert rollout_dict[spec.id]['actions'] == actions_now, 'Actions not equal for {}'.format(spec.id)`
			`assert rollout_dict[spec.id]['rewards'] == rewards_now, 'Rewards not equal for {}'.format(spec.id)`
			`assert rollout_dict[spec.id]['dones'] == dones_now, 'Dones not equal for {}'.format(spec.id)`