From 90d34a8d617ba10cfc57a1b788a68892abb0a5ec Mon Sep 17 00:00:00 2001 From: pseudo-rnd-thoughts Date: Wed, 2 Jul 2025 22:33:00 +0000 Subject: [PATCH] =?UTF-8?q?Deploying=20to=20gh-pages=20from=20@=20Farama-F?= =?UTF-8?q?oundation/Gymnasium@7f11576fe64633b2c5237194cf061e8501b78f17=20?= =?UTF-8?q?=F0=9F=9A=80?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- .buildinfo | 2 +- 404.html | 7 +- README/index.html | 7 +- .../tutorials_python.zip | Bin 117152 -> 127435 bytes .../action_masking_taxi.py | 297 +++++ .../tutorials_jupyter.zip | Bin 142798 -> 154666 bytes .../action_masking_taxi.ipynb | 86 ++ .../sphx_glr_action_masking_taxi_thumb.png | Bin 0 -> 10846 bytes _images/taxi_v3_action_masking_comparison.png | Bin 0 -> 111154 bytes _modules/gymnasium/core/index.html | 7 +- .../envs/functional_jax_env/index.html | 7 +- .../gymnasium/envs/registration/index.html | 7 +- .../experimental/functional/index.html | 7 +- _modules/gymnasium/spaces/box/index.html | 7 +- _modules/gymnasium/spaces/dict/index.html | 7 +- _modules/gymnasium/spaces/discrete/index.html | 7 +- _modules/gymnasium/spaces/graph/index.html | 7 +- .../gymnasium/spaces/multi_binary/index.html | 7 +- .../spaces/multi_discrete/index.html | 7 +- _modules/gymnasium/spaces/oneof/index.html | 7 +- _modules/gymnasium/spaces/sequence/index.html | 7 +- _modules/gymnasium/spaces/space/index.html | 7 +- _modules/gymnasium/spaces/text/index.html | 7 +- _modules/gymnasium/spaces/tuple/index.html | 7 +- _modules/gymnasium/spaces/utils/index.html | 7 +- .../gymnasium/utils/env_checker/index.html | 7 +- _modules/gymnasium/utils/ezpickle/index.html | 7 +- .../gymnasium/utils/performance/index.html | 7 +- _modules/gymnasium/utils/play/index.html | 7 +- .../gymnasium/utils/save_video/index.html | 7 +- _modules/gymnasium/utils/seeding/index.html | 7 +- .../utils/step_api_compatibility/index.html | 7 +- .../vector/async_vector_env/index.html | 7 +- .../vector/sync_vector_env/index.html | 7 +- .../gymnasium/vector/utils/misc/index.html | 7 +- .../vector/utils/shared_memory/index.html | 7 +- .../vector/utils/space_utils/index.html | 7 +- .../gymnasium/vector/vector_env/index.html | 7 +- .../wrappers/array_conversion/index.html | 7 +- .../wrappers/atari_preprocessing/index.html | 7 +- _modules/gymnasium/wrappers/common/index.html | 7 +- .../wrappers/jax_to_numpy/index.html | 7 +- .../wrappers/jax_to_torch/index.html | 7 +- .../wrappers/numpy_to_torch/index.html | 7 +- .../gymnasium/wrappers/rendering/index.html | 7 +- .../wrappers/stateful_action/index.html | 7 +- .../wrappers/stateful_observation/index.html | 7 +- .../wrappers/stateful_reward/index.html | 7 +- .../wrappers/transform_action/index.html | 7 +- .../wrappers/transform_observation/index.html | 7 +- .../wrappers/transform_reward/index.html | 7 +- .../vector/array_conversion/index.html | 7 +- .../wrappers/vector/common/index.html | 7 +- .../vector/dict_info_to_list/index.html | 7 +- .../wrappers/vector/jax_to_numpy/index.html | 7 +- .../wrappers/vector/jax_to_torch/index.html | 7 +- .../wrappers/vector/numpy_to_torch/index.html | 7 +- .../vector/stateful_observation/index.html | 7 +- .../vector/stateful_reward/index.html | 7 +- .../vector/vectorize_action/index.html | 7 +- .../vector/vectorize_observation/index.html | 7 +- .../vector/vectorize_reward/index.html | 7 +- _modules/index.html | 7 +- .../taxi_v3_action_masking_comparison.png | Bin 0 -> 111154 bytes api/env/index.html | 11 +- api/functional/index.html | 7 +- api/registry/index.html | 7 +- api/spaces/composite/index.html | 7 +- api/spaces/fundamental/index.html | 7 +- api/spaces/index.html | 7 +- api/spaces/utils/index.html | 7 +- api/utils/index.html | 7 +- api/vector/async_vector_env/index.html | 7 +- api/vector/index.html | 7 +- api/vector/sync_vector_env/index.html | 7 +- api/vector/utils/index.html | 7 +- api/vector/wrappers/index.html | 7 +- api/wrappers/action_wrappers/index.html | 7 +- api/wrappers/index.html | 7 +- api/wrappers/misc_wrappers/index.html | 7 +- api/wrappers/observation_wrappers/index.html | 7 +- api/wrappers/reward_wrappers/index.html | 7 +- api/wrappers/table/index.html | 7 +- environments/atari/adventure/index.html | 7 +- environments/atari/air_raid/index.html | 7 +- environments/atari/alien/index.html | 7 +- environments/atari/amidar/index.html | 7 +- environments/atari/assault/index.html | 7 +- environments/atari/asterix/index.html | 7 +- environments/atari/asteroids/index.html | 7 +- environments/atari/atlantis/index.html | 7 +- environments/atari/atlantis2/index.html | 7 +- environments/atari/backgammon/index.html | 7 +- environments/atari/bank_heist/index.html | 7 +- environments/atari/basic_math/index.html | 7 +- environments/atari/battle_zone/index.html | 7 +- environments/atari/beam_rider/index.html | 7 +- environments/atari/berzerk/index.html | 7 +- environments/atari/blackjack/index.html | 7 +- environments/atari/bowling/index.html | 7 +- environments/atari/boxing/index.html | 7 +- environments/atari/breakout/index.html | 7 +- environments/atari/carnival/index.html | 7 +- environments/atari/casino/index.html | 7 +- environments/atari/centipede/index.html | 7 +- environments/atari/chopper_command/index.html | 7 +- environments/atari/crazy_climber/index.html | 7 +- environments/atari/crossbow/index.html | 7 +- environments/atari/darkchambers/index.html | 7 +- environments/atari/defender/index.html | 7 +- environments/atari/demon_attack/index.html | 7 +- environments/atari/donkey_kong/index.html | 7 +- environments/atari/double_dunk/index.html | 7 +- environments/atari/earthworld/index.html | 7 +- environments/atari/elevator_action/index.html | 7 +- environments/atari/enduro/index.html | 7 +- environments/atari/entombed/index.html | 7 +- environments/atari/et/index.html | 7 +- environments/atari/fishing_derby/index.html | 7 +- environments/atari/flag_capture/index.html | 7 +- environments/atari/freeway/index.html | 7 +- environments/atari/frogger/index.html | 7 +- environments/atari/frostbite/index.html | 7 +- environments/atari/galaxian/index.html | 7 +- environments/atari/gopher/index.html | 7 +- environments/atari/gravitar/index.html | 7 +- environments/atari/hangman/index.html | 7 +- environments/atari/haunted_house/index.html | 7 +- environments/atari/hero/index.html | 7 +- .../atari/human_cannonball/index.html | 7 +- environments/atari/ice_hockey/index.html | 7 +- environments/atari/index.html | 7 +- environments/atari/jamesbond/index.html | 7 +- environments/atari/journey_escape/index.html | 7 +- environments/atari/kaboom/index.html | 7 +- environments/atari/kangaroo/index.html | 7 +- environments/atari/keystone_kapers/index.html | 7 +- environments/atari/king_kong/index.html | 7 +- environments/atari/klax/index.html | 7 +- environments/atari/koolaid/index.html | 7 +- environments/atari/krull/index.html | 7 +- environments/atari/kung_fu_master/index.html | 7 +- environments/atari/laser_gates/index.html | 7 +- environments/atari/lost_luggage/index.html | 7 +- environments/atari/mario_bros/index.html | 7 +- environments/atari/miniature_golf/index.html | 7 +- .../atari/montezuma_revenge/index.html | 7 +- environments/atari/mr_do/index.html | 7 +- environments/atari/ms_pacman/index.html | 7 +- environments/atari/name_this_game/index.html | 7 +- environments/atari/othello/index.html | 7 +- environments/atari/pacman/index.html | 7 +- environments/atari/phoenix/index.html | 7 +- environments/atari/pitfall/index.html | 7 +- environments/atari/pitfall2/index.html | 7 +- environments/atari/pong/index.html | 7 +- environments/atari/pooyan/index.html | 7 +- environments/atari/private_eye/index.html | 7 +- environments/atari/qbert/index.html | 7 +- environments/atari/riverraid/index.html | 7 +- environments/atari/road_runner/index.html | 7 +- environments/atari/robotank/index.html | 7 +- environments/atari/seaquest/index.html | 7 +- environments/atari/sir_lancelot/index.html | 7 +- environments/atari/skiing/index.html | 7 +- environments/atari/solaris/index.html | 7 +- environments/atari/space_invaders/index.html | 7 +- environments/atari/space_war/index.html | 7 +- environments/atari/star_gunner/index.html | 7 +- environments/atari/superman/index.html | 7 +- environments/atari/surround/index.html | 7 +- environments/atari/tennis/index.html | 7 +- environments/atari/tetris/index.html | 7 +- environments/atari/tic_tac_toe_3d/index.html | 7 +- environments/atari/time_pilot/index.html | 7 +- environments/atari/trondead/index.html | 7 +- environments/atari/turmoil/index.html | 7 +- environments/atari/tutankham/index.html | 7 +- environments/atari/up_n_down/index.html | 7 +- environments/atari/venture/index.html | 7 +- environments/atari/video_checkers/index.html | 7 +- environments/atari/video_chess/index.html | 7 +- environments/atari/video_cube/index.html | 7 +- environments/atari/video_pinball/index.html | 7 +- environments/atari/wizard_of_wor/index.html | 7 +- environments/atari/word_zapper/index.html | 7 +- environments/atari/yars_revenge/index.html | 7 +- environments/atari/zaxxon/index.html | 7 +- environments/box2d/bipedal_walker/index.html | 7 +- environments/box2d/car_racing/index.html | 7 +- environments/box2d/index.html | 7 +- environments/box2d/lunar_lander/index.html | 7 +- .../classic_control/acrobot/index.html | 7 +- .../classic_control/cart_pole/index.html | 7 +- environments/classic_control/index.html | 7 +- .../classic_control/mountain_car/index.html | 7 +- .../mountain_car_continuous/index.html | 7 +- .../classic_control/pendulum/index.html | 7 +- environments/mujoco/ant/index.html | 7 +- environments/mujoco/half_cheetah/index.html | 7 +- environments/mujoco/hopper/index.html | 7 +- environments/mujoco/humanoid/index.html | 7 +- .../mujoco/humanoid_standup/index.html | 7 +- environments/mujoco/index.html | 7 +- .../inverted_double_pendulum/index.html | 7 +- .../mujoco/inverted_pendulum/index.html | 7 +- environments/mujoco/pusher/index.html | 7 +- environments/mujoco/reacher/index.html | 7 +- environments/mujoco/swimmer/index.html | 7 +- environments/mujoco/walker2d/index.html | 7 +- .../third_party_environments/index.html | 7 +- environments/toy_text/blackjack/index.html | 7 +- .../toy_text/cliff_walking/index.html | 7 +- .../cliff_walking_slippery/index.html | 7 +- environments/toy_text/frozen_lake/index.html | 7 +- environments/toy_text/index.html | 7 +- environments/toy_text/taxi/index.html | 7 +- genindex/index.html | 7 +- gym_release_notes/index.html | 7 +- gymnasium_release_notes/index.html | 7 +- index.html | 9 +- introduction/basic_usage/index.html | 7 +- introduction/create_custom_env/index.html | 7 +- introduction/gym_compatibility/index.html | 767 ------------ introduction/migration_guide/index.html | 146 +-- introduction/record_agent/index.html | 7 +- introduction/speed_up_env/index.html | 13 +- introduction/train_agent/index.html | 7 +- objects.inv | Bin 6368 -> 6394 bytes py-modindex/index.html | 7 +- search/index.html | 7 +- searchindex.js | 2 +- tutorials/gymnasium_basics/README/index.html | 7 +- .../environment_creation/index.html | 9 +- .../handling_time_limits/index.html | 9 +- .../implementing_custom_wrappers/index.html | 9 +- tutorials/gymnasium_basics/index.html | 7 +- .../load_quadruped_model/index.html | 9 +- tutorials/index.html | 12 +- tutorials/third-party-tutorials/index.html | 7 +- tutorials/training_agents/README/index.html | 7 +- .../action_masking_taxi/index.html | 1025 +++++++++++++++++ .../blackjack_q_learning/index.html | 15 +- .../frozenlake_q_learning/index.html | 9 +- tutorials/training_agents/index.html | 18 +- .../mujoco_reinforce/index.html | 9 +- .../training_agents/vector_a2c/index.html | 9 +- 247 files changed, 2658 insertions(+), 1355 deletions(-) create mode 100644 _downloads/59d32aca01d2a167e2c4cd11db2248db/action_masking_taxi.py create mode 100644 _downloads/f568409c70f62ce68a7552285b9724db/action_masking_taxi.ipynb create mode 100644 _images/sphx_glr_action_masking_taxi_thumb.png create mode 100644 _images/taxi_v3_action_masking_comparison.png create mode 100644 _static/img/tutorials/taxi_v3_action_masking_comparison.png delete mode 100644 introduction/gym_compatibility/index.html create mode 100644 tutorials/training_agents/action_masking_taxi/index.html diff --git a/.buildinfo b/.buildinfo index 8a0801519..4f9cab126 100644 --- a/.buildinfo +++ b/.buildinfo @@ -1,4 +1,4 @@ # Sphinx build info version 1 # This file hashes the configuration used when building these files. When it is not found, a full rebuild will be done. -config: cf2f46ba41b047a4e64ef75619dcaa75 +config: 6d4f87dbf34d776c4b3c01f5217c4cd7 tags: d77d1c0d9ca2f4c8421862c7c5a0d620 diff --git a/404.html b/404.html index 0c2596cb8..0bf859d4c 100644 --- a/404.html +++ b/404.html @@ -221,8 +221,7 @@
  • Create a Custom Environment
  • Recording Agents
  • Speeding Up Training
  • -
  • Compatibility with Gym
  • -
  • Migration Guide - v0.21 to v1.0.0
  • +
  • Gym Migration Guide
  • API

  • Training Agents

    API

  • Training Agents

    API

      @@ -301,6 +300,10 @@
  • Training Agents

    API

      @@ -301,6 +300,10 @@
  • Training Agents

    API

      @@ -301,6 +300,10 @@
  • Training Agents

    API

      @@ -301,6 +300,10 @@
  • Training Agents

    API

      @@ -301,6 +300,10 @@
  • Training Agents

    API

      @@ -301,6 +300,10 @@
  • Training Agents

    API

      @@ -301,6 +300,10 @@
  • Training Agents

    API

      @@ -301,6 +300,10 @@
  • Training Agents

    API

      @@ -301,6 +300,10 @@
  • Training Agents

    API

      @@ -301,6 +300,10 @@
  • Training Agents

    API

      @@ -301,6 +300,10 @@
  • Training Agents

    API

      @@ -301,6 +300,10 @@
  • Training Agents

    API

      @@ -301,6 +300,10 @@
  • Training Agents

    API

      @@ -301,6 +300,10 @@
  • Training Agents

    API

      @@ -301,6 +300,10 @@
  • Training Agents

    API

      @@ -301,6 +300,10 @@
  • Training Agents

    API

      @@ -301,6 +300,10 @@
  • Training Agents

    API

      @@ -301,6 +300,10 @@
  • Training Agents

    API

      @@ -301,6 +300,10 @@
  • Training Agents

    API

      @@ -301,6 +300,10 @@
  • Training Agents

    API

      @@ -301,6 +300,10 @@
  • Training Agents

    API

      @@ -301,6 +300,10 @@
  • Training Agents

    API

      @@ -301,6 +300,10 @@
  • Training Agents

    API

      @@ -301,6 +300,10 @@
  • Training Agents

    API

      @@ -301,6 +300,10 @@
  • Training Agents

    API

      @@ -301,6 +300,10 @@
  • Training Agents

    API

      @@ -301,6 +300,10 @@
  • Training Agents

    API

      @@ -301,6 +300,10 @@
  • Training Agents

    API

      @@ -301,6 +300,10 @@
  • Training Agents

    API

      @@ -301,6 +300,10 @@
  • Training Agents

    API

      @@ -301,6 +300,10 @@
  • Training Agents

    API

      @@ -301,6 +300,10 @@
  • Training Agents

    API

      @@ -301,6 +300,10 @@
  • Training Agents

    API

      @@ -301,6 +300,10 @@
  • Training Agents

    API

      @@ -301,6 +300,10 @@
  • Training Agents

    API

      @@ -301,6 +300,10 @@
  • Training Agents

    API

      @@ -301,6 +300,10 @@
  • Training Agents

    API

      @@ -301,6 +300,10 @@
  • Training Agents

    API

      @@ -301,6 +300,10 @@
  • Training Agents

    API

      @@ -301,6 +300,10 @@
  • Training Agents

    API

      @@ -301,6 +300,10 @@
  • Training Agents

    API

      @@ -301,6 +300,10 @@
  • Training Agents

    API

      @@ -301,6 +300,10 @@
  • Training Agents

    API

      @@ -301,6 +300,10 @@
  • Training Agents

    API

      @@ -301,6 +300,10 @@
  • Training Agents

    API

      @@ -301,6 +300,10 @@
  • Training Agents

    API

      @@ -301,6 +300,10 @@
  • Training Agents

    API

      @@ -301,6 +300,10 @@
  • Training Agents

    API

      @@ -301,6 +300,10 @@
  • Training Agents

    API

      @@ -301,6 +300,10 @@
  • Training Agents

    API

      @@ -301,6 +300,10 @@
  • Training Agents

    API

      @@ -301,6 +300,10 @@
  • Training Agents

    API

      @@ -301,6 +300,10 @@
  • Training Agents

    API

      @@ -301,6 +300,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -300,6 +299,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents
      +
    • Action Masking in the Taxi Environment
    • +
    • Running the Experiment
    • +
    • Visualizing Results
    • +
    • Results Analysis
    • Solving Blackjack with Tabular Q-Learning
    • Solving Frozenlake with Tabular Q-Learning
    • Training using REINFORCE for Mujoco
    • diff --git a/introduction/gym_compatibility/index.html b/introduction/gym_compatibility/index.html deleted file mode 100644 index c81691f3b..000000000 --- a/introduction/gym_compatibility/index.html +++ /dev/null @@ -1,767 +0,0 @@ - - - - - - - - - - - - - - - Compatibility with Gym - Gymnasium Documentation - - - - - - - - - - - - - -
      -
      -
      - -
      - -
      -
      - - -
      -
      -
      -
      - - - - - - - - Contents - - - - - - Menu - - - - - - - - Expand - - - - - - Light mode - - - - - - - - - - - - - - Dark mode - - - - - - - Auto light/dark mode - - - - - - - - - - - - - - - - - -
      - - -
      - - - - - -
      -
      -
      - - - - - Back to top - -
      - -
      - -
      -
      - -
      -

      Compatibility with Gym

      -

      Gymnasium provides a number of compatibility methods for using older Gym Environment implementations.

      -
      -

      Loading OpenAI Gym environments

      -

      For environments that are registered solely in OpenAI Gym and not in Gymnasium, Gymnasium v0.26.3 and above allows importing them through either a special environment or a wrapper. The "GymV26Environment-v0" environment was introduced in Gymnasium v0.26.3, and allows importing of Gym environments through the env_name argument along with other relevant kwargs environment kwargs. To perform conversion through a wrapper, the environment itself can be passed to the wrapper EnvCompatibility through the env kwarg.

      -
      import gymnasium as gym
      -
      -env = gym.make("GymV26Environment-v0", env_id="GymEnv-v1")
      -
      -
      -
      -
      -

      Gym v0.21 Environment Compatibility

      -

      A number of environments have not updated to the recent Gym changes, in particular since v0.21. This update is significant for the introduction of termination and truncation signatures in favour of the previously used done. To allow backward compatibility, Gym and Gymnasium v0.26+ include an apply_api_compatibility kwarg when calling make() that automatically converts a v0.21 API compliant environment to one that is compatible with v0.26+.

      -
      import gym
      -
      -env = gym.make("OldV21Env-v0", apply_api_compatibility=True)
      -
      -
      -

      Additionally, in Gymnasium we provide specialist environments for compatibility that for env_id will call gym.make.

      -
      import gymnasium
      -
      -env = gymnasium.make("GymV21Environment-v0", env_id="CartPole-v1", render_mode="human")
      -# or
      -env = gymnasium.make("GymV21Environment-v0", env=OldV21Env())
      -
      -
      -
      -
      -
      -

      Step API Compatibility

      -

      If environments implement the (old) done step API, Gymnasium provides both functions (gymnasium.utils.step_api_compatibility.convert_to_terminated_truncated_step_api()) and wrappers (gymnasium.wrappers.StepAPICompatibility) that will convert an environment with the old step API (using done) to the new step API (using termination and truncation).

      -
      -
      - -
      -
      - -
      - -
      -
      -
      - - - - - - - - - - - - - - - - - - \ No newline at end of file diff --git a/introduction/migration_guide/index.html b/introduction/migration_guide/index.html index 6e88f3a60..4a9b06e41 100644 --- a/introduction/migration_guide/index.html +++ b/introduction/migration_guide/index.html @@ -8,11 +8,11 @@ - + - Migration Guide - v0.21 to v1.0.0 - Gymnasium Documentation + Gym Migration Guide - Gymnasium Documentation @@ -221,8 +221,7 @@
    • Create a Custom Environment
    • Recording Agents
    • Speeding Up Training
    • -
    • Compatibility with Gym
    • -
    • Migration Guide - v0.21 to v1.0.0
    • +
    • Gym Migration Guide

    API

      @@ -302,6 +301,10 @@
  • Training Agents
      +
    • Action Masking in the Taxi Environment
    • +
    • Running the Experiment
    • +
    • Visualizing Results
    • +
    • Results Analysis
    • Solving Blackjack with Tabular Q-Learning
    • Solving Frozenlake with Tabular Q-Learning
    • Training using REINFORCE for Mujoco
    • @@ -373,8 +376,8 @@
      -
      -

      Migration Guide - v0.21 to v1.0.0

      +
      +

      Gym Migration Guide

      Who Should Read This Guide?

      If you’re new to Gymnasium: You can probably skip this page! This guide is for users migrating from older versions of OpenAI Gym. If you’re just starting with RL, head to Basic Usage instead.

      @@ -384,12 +387,14 @@

      Why Did the API Change?

      Gymnasium is a fork of OpenAI Gym v0.26, which introduced breaking changes from Gym v0.21. These changes weren’t made lightly - they solved important problems that made RL research and development more difficult.

      -

      The main issues with the old API were: -- Ambiguous episode endings: The single done flag couldn’t distinguish between “task completed” and “time limit reached” -- Inconsistent seeding: Random number generation was unreliable and hard to reproduce -- Rendering complexity: Switching between visual modes was unnecessarily complicated -- Reproducibility problems: Subtle bugs made it difficult to reproduce research results

      -

      For environments still using the v0.21 API, see the compatibility guide.

      +

      The main issues with the old API were:

      +
        +
      • Ambiguous episode endings: The single done flag couldn’t distinguish between “task completed” and “time limit reached”

      • +
      • Inconsistent seeding: Random number generation was unreliable and hard to reproduce

      • +
      • Rendering complexity: Switching between visual modes was unnecessarily complicated

      • +
      • Reproducibility problems: Subtle bugs made it difficult to reproduce research results

      • +
      +

      For environments that can’t be updated, see the compatibility guide section below.

      Quick Reference: Complete Changes Table

      @@ -500,8 +505,7 @@

      Old: import gym New: import gymnasium as gym

      Why: Gymnasium is a separate project that maintains and improves upon the original Gym codebase.

      -
      # Update your imports
      -# OLD
      +
      # OLD
       import gym
       
       # NEW
      @@ -666,69 +670,6 @@ pass

      This makes time limit detection much cleaner and more explicit.

      -
      
      -## Updating Your Training Code
      -
      -### Basic Training Loop Migration
      -
      -**Old v0.21 pattern**:
      -```python
      -for episode in range(num_episodes):
      -    obs = env.reset()
      -    done = False
      -
      -    while not done:
      -        action = agent.get_action(obs)
      -        next_obs, reward, done, info = env.step(action)
      -
      -        # Train agent (this may have bugs due to ambiguous 'done')
      -        agent.learn(obs, action, reward, next_obs, done)
      -        obs = next_obs
      -
      -
      -

      New v0.26+ pattern:

      -
      for episode in range(num_episodes):
      -    obs, info = env.reset(seed=episode)  # Optional: unique seed per episode
      -    terminated, truncated = False, False
      -
      -    while not (terminated or truncated):
      -        action = agent.get_action(obs)
      -        next_obs, reward, terminated, truncated, info = env.step(action)
      -
      -        # Train agent with proper termination handling
      -        agent.learn(obs, action, reward, next_obs, terminated)
      -        obs = next_obs
      -
      -
      -
      -

      Q-Learning Update Migration

      -

      Old v0.21 (potentially incorrect):

      -
      def update_q_value(obs, action, reward, next_obs, done):
      -    if done:
      -        target = reward  # Assumes all episode endings are natural terminations
      -    else:
      -        target = reward + gamma * max(q_table[next_obs])
      -
      -    q_table[obs][action] += lr * (target - q_table[obs][action])
      -
      -
      -

      New v0.26+ (correct):

      -
      def update_q_value(obs, action, reward, next_obs, terminated):
      -    if terminated:
      -        # Natural termination - no future value
      -        target = reward
      -    else:
      -        # Episode continues - truncation has no impact on the possible future value
      -        target = reward + gamma * max(q_table[next_obs])
      -
      -    q_table[obs][action] += lr * (target - q_table[obs][action])
      -
      -
      -
      -
      -

      Deep RL Framework Migration

      -

      Most libraries have already updated, see their documentation for more information.

      -

      Environment-Specific Changes

      @@ -755,14 +696,30 @@ for episode in range(num_episodes):

      Compatibility Helpers

      -
      -

      Using Old Environments

      -

      If you need to use an environment that hasn’t been updated to the new API:

      -

      ```python -# For environments still using old gym -env = gym.make(“GymV21Environment-v0”, env_id=”OldEnv-v0”)

      -

      # This wrapper converts old API to new API automatically

      -

      For more details, see the compatibility guide <gym_compatibility>_.

      +
      +

      Loading OpenAI Gym environments

      +

      For environments that can’t be updated to Gymnasium, we provide compatibility wrappers either for v21 and v26 style environments, where either the environment name or the environment itself can be passed.

      +
      import gymnasium
      +import shimmy  # install shimmy with `pip install shimmy`
      +
      +gymnasium.register_envs(shimmy)
      +
      +
      +# Gym v0.21 style environments
      +env = gymnasium.make("GymV21Environment-v0", env_id="CartPole-v1")
      +# or
      +env = gymnasium.make("GymV21Environment-v0", env=OldV21Env())
      +
      +# Gym v0.26 style environments
      +env = gymnasium.make("GymV26Environment-v0", env_id="Cartpole-v1")
      +# or
      +env = gymnasium.make("GymV26Environment-v0", env=OldV26Env())
      +
      +
      +
      +
      +

      Step API Compatibility

      +

      If environments implement the (old) done step API, Gymnasium provides functions (convert_to_terminated_truncated_step_api() and convert_to_done_step_api()) that will convert an environment with the old step API (using done) to the new step API (using termination and truncation), and vice versa.

      @@ -776,7 +733,7 @@ env = gym.make(“GymV21Environment-v0”, env_id=”OldEnv-v0”)

    • [ ] Random seeding uses the seed parameter in reset()

    • [ ] Training algorithms properly distinguish termination types

    -

    Use the from gymnasium.utils.env_checker import check_env to verify their implementation.

    +

    Use the check_env() to verify their implementation.

    Getting Help

    @@ -789,7 +746,7 @@ env = gym.make(“GymV21Environment-v0”, env_id=”OldEnv-v0”)

    Common resources:

    @@ -812,7 +769,7 @@ env = gym.make(“GymV21Environment-v0”, env_id=”OldEnv-v0”)

    - + @@ -821,7 +778,7 @@ env = gym.make(“GymV21Environment-v0”, env_id=”OldEnv-v0”)

    Previous -
    Compatibility with Gym
    +
    Speeding Up Training
    @@ -865,7 +822,7 @@ env = gym.make(“GymV21Environment-v0”, env_id=”OldEnv-v0”)

      -
    • Migration Guide - v0.21 to v1.0.0

      API

        @@ -302,6 +301,10 @@
    • Training Agents

      API

        @@ -302,6 +301,10 @@
    • Training Agents

      API

        @@ -302,6 +301,10 @@
    • Training Agents
        +
      • Action Masking in the Taxi Environment
      • +
      • Running the Experiment
      • +
      • Visualizing Results
      • +
      • Results Analysis
      • Solving Blackjack with Tabular Q-Learning
      • Solving Frozenlake with Tabular Q-Learning
      • Training using REINFORCE for Mujoco
      • diff --git a/objects.inv b/objects.inv index 0e74c03b82eea253a391e134cbdef15dd815e0f4..7e5d46657fe8a8ec016e0b76e0460b84d1f95b5e 100644 GIT binary patch delta 6328 zcmV;p7)R&eG5Rr(dViCgII@7>`&SU*^IBcI-hJ9QaUwi++cUHF*xUB(#Mu`@1*$5h z0bwrPUH+BczYCSAndMuoPXQF%SS>=XB0OTOE{{q zwym>W*K)gBl8c64m}d|M8J4n^1@Ox%u34Fi0(GidKq1?cr%K##p8D&FUBl}~w&*g{ zyiC zajz0sP+RZft!wILTmZ7a31k@h9k&|QmAJH;wRfuTlmZJ$c1|uOTQB9(?F-r4>y>dL zYHo@EHZHGiaQ~MXOdR@V)ag!r{)L{c7v6YvmDV2pB7Z+aSGsX^f2Pj(A_FJ-)nzX_ zhQLK@Zuea&FE`8MKiP8(=WgE*r+#J6MEG=8nO6W`qN&kdg-o^UD}c!+=-}4;kTq>B z>j_rMuevpjucnqcxdHkfu7f094Hv(SOIC1Wi06;nXJr~6v%`@$ZTtw8PDdd9g$V|t zFNCvkmVd6orH76_J&a-?}-DNcoYvOj$ zZB}M&#`2Js;vm{$+vQX}0HNc&)!3|HhnK*@#l0$(jLeqB)@DaL7avaRnAv3_!=wT zWl3we6p1J*0X2i_JGy5;tX1KKR!S}cU*Wwr0&W)q8Tf0 z$$zIVZ?m7EcUJ9x(OnraR^ONjYt_Axq}4TULb*=qu2lCvm;Cd7VcnCuE9;(Stf+fm z`S*^O313)8tiGVwtm5nK1n{L{kDr&yXLv>$^BL1_1uw!Sw za5ezA)Ut~AIgDQT013ClHh1ZvZolzXO@GV1w(1?((rey|g;)F=e{L7|U#Psg+ftBK zz16o)Td<&^OWl>NTr*ZQ@f}2OlSp)9z64|lOE6Q6sHQ>P#$*&743bdoUoM?rh{=OC zk;OsA9kb}i-*Tl$a0~R0@lLsaGBgP(!5Co7Y`9v6cp*4L+jSEq7yG&A_P=gQk$>Pe zy$`!|ss8jqm&!nPVKXl`MZYpQMS|91e=_aXLN2q^q_DD$&w3jF@+(Dx+qGHV+@iBf zvw|4%YPJ+JbRK5}_{%FGV$*DfL@S`#$KpfZ#5xJRBm;KD5ajrBt7j6&w95kIOd zd4T(S_v4F9%$(3571bbUbW0Jv8?-;HP5sS$_&!G5*w3+ zUPN>2b7(m?ID2BO4a`e9U6H$O2el`{qw#qo91YFM=?bii&5F`^ZQAx^8TMrbX&X0n zds8g^j7zzJ_&4YAm1?@CUGoZ?cBT8OTlzPbu5CZ42g1FJJ){@2Z+~K6*F#!2u`dSc z?K103yMj^nE$T~1_EsN=vNYZxlC7pYK=XjsIA+^8;$YX{kH~wT^;e&q-5Gy%<*Nq1 zZ*$S5YNl&c(`KVvovCe*t7tpcCP(93p*JSUIRmc%<8GYDdt`O9iYDaL08SLF!r;D8 z9`mAVPcf@&atbJv)_)vX&C|Hxg{W8YvX<8?3kVjav0SOWnpICV*o9LyS0Ij>h&AHg z7#hA;-0qXFrCGkRMBqMXk0%a%%jJ0Bz+{2_83ft(?kiY|tWW5)WF->g-F+^?$53#Gq?|9bD4hF|Xjf z&9mxFV!dpRhjAyU`(gX>l7|cj)H|ND)75Y3JKP>~b?W;pZ(pGPy;o~-*XP!(;9pyo zJX{_90a{Fxu>AVh_~))*rE2Kwo6fK7`J4EyE2`5qK;J~299M!qvFA5s`t>2Ju72fy z!!^Y``@vt1e1D}jFYm~8uIJ|(D#~5C2h{rN@&z=rM-BnPTeV)jl6TJ&QKxrR)`%1v zVw*K>mNZwP{<~jbTt&iW_EzLMxBCTOoa_>=XjL|xR388xG&N6zCw+8I9=(Q ze#;8}2HNQL%|!CYtjN{|Dc|~Md#+XDo_GBc_v9;eihptx8z(~;Y7R>`_ABcV;nD_R z;2Kxs$kiImE->SgMp}}HqQDDq8Tc;9bAZ^gGP#lP{AMIurWSV-p6?~hmbKF}g&SZ( z+RPw&jqr@m5Hc%#B)k=Ii7^Km5QgVCqS&%*F}@)~$Awuc3Yn!W-Z@h`!V1rJ!XY!R z`%v8&xqpY}IwLvqCF7x`^;cn>Ihx|8CE3ncWZv@8+R@tM|#a5A6yHzS?Gmm=% z-U4GBM3WW_kGA&>otm^;(#%I3zl;roxg~i|QGb5f8^-}l44A_lCXDN(eb#w#og}dV zW|`+Vmv_H&WPmxAiP7bK?*%i&Aj_2Ma*HmZ0Vdg}OcxtPVgt;wO|vXEihzchWSpT{ zW6~TNX42KYAc<;zD`OHMl^a&k9)}(!83r1VpaB z1cH2)oR%W5QiW|RO@S!S#hhTOWzA$6>w5RXy;KqoylQ1}tQIV#y?}vNsm*G44P3$N zmirQWy$f*3zRHydUM#U}U2?f~n;n7E>3;!M1Wl)F9eksNeA66G1m~b&bm8Il%t$sf zd}rJPa(B(RPjhxoyocs&ng7;eA@lD6xx44z`;E(sr};vx@t)tCTje>Sw!{{XK>e}r zggj=|0!(ntshM)OPpt*@5zdJ^= z9QQn1fIXfQY<7d(^K2m&c}}odP4b#&3oy!mg3W4{$2?nj%U^AhYo0C4B(DiJmr2)i zSDq7WR)f6e*_L#c>&)^D*{{)eh8yah5Dav(K`!2NR&dEZTVjWM0CbI;G+6fczx+LF z+Vmf(NDvH%Tl_EDL|^co=D&$HdVi0vL%zAcd-Lwo-B?zg*+w7wd^hkzbHkEa>_81A zbGG9-%JT9tt3`=#>1wvJ7+HeDv9=cZR%>iuW$9nRB>jbtaaR3DKcc(x@n-ra?77(J z9ofU@-z^rs z9YilNqj#GbK;yTcVSxwnOPG8>%Yac2Z)v6IcRaco-ijEoXr>0l(267dER<3o#PJg#BMW5i%z@t`~j979>DjGW*I+NKVj*&lK?1^+2NmE<- zW>ynR{<@9i#E00Q5xcD7Da+$0mg9y?a}T)_&#%+%RJ`vVcR5QQ{=^rsne|(7it)XP z+d;V3PFNk+Ol~!GWq%eODYtPYbjkfX_d#cXIDNRnr(oQm z*>fj4a)+;scQBv6F%LGjVcbz>uNm2?)GGQc%ENy&PD5q(d zBzbMl$~JT2v>4VZm4C9qUVGABpK-4#9=^@-z;I&P0Xz$Cqo0N}jVvGHBgYQVh3o|p zSw2KRW12={w^Fe7=tTB{h=eqRbnTHwwr$SiAEM+=<{*hsJc#}S2PBoVBCfNPyPC#X z5SWmT?lDax>mR&+aPp)S!eoLZO}vMNH8_swr#?yY#8ck)<9`;Kk^+`W(4=P{(6i<| zn=mzJ52AC{J1qt%ouXjiyvpox8hcyBAePrD8rEc`aH3EMLHL)%KpF!BSCt*)0M;i- z-ciVJKjP994tpHbsWhXvgL+7g41e=-_0(h0ZS-z*M1uKVy>!O`)nWkDDH;ZyF1||7-HOMe2*ob`jXWa3 zqI}?|_(3?E;Ybp&@*w)Bpc`Z=I*5kjv@4y~o+Xir2hlq?pr{F(s9Ok}swdvyp^5)Mgr&JJ^WnuD%^{0qYpYo!bEj+mQo1; zNd6@;HGg}|TIX<~7Xy?|QLrN`4~4UQT522ptP(V-EAh?KN6|Ih$s5TcRUSq^;~~lB z&c==+K;m>mKjL$3P_@falskNHt^+m`2QZ$2*3h4!GRYDSB}%Xhx8u)(+vt~sL%A_c zA^*fLsP2R_m>A@?(XV}y!QbE_R^_@&Q-5I~tK;ZS9#i-SwiBXoV3p7|`ltL$ zW6A@og>ZtD7@|~)gz;0;;``ShSmlmJX3~JxCm@f?5R=I14-a2I$N?3*Y?GgVfG)&^ z0ui9V|0F<&+&#Uar2wN6B&qJ4jYY};1^qsGUFm>Lgn0{#>64xEky zdltl%6iCDPN|3e|S(!2P((ys$dlz;hjI+x67(7nCC-DM0=O57j#Wj8>!g)O|T2>*26#0@wIrj7E0(w&+J7JitS0&*lN1lXU>&!|tbuA%xC%ZM-bTNn z$~QQU@M9YkUbIJ^=dMC)scrOGB`A_tsrw?E%Uc}6W3P>tp zA-(oPy&hQP3|-~!rYqS)e=&5zSS?Ug~rhmeEeLVU_ADi({&VkM#*F*oHhdK@XA0K=w;z$yh zIMn)JtcXnqVWGS0?ZtqnQ#7ouagT@-ro<4YQWUJ^W$C=nN@yE>lYePUTYF&IT47p4 zWofe{ZW;U&JpP-jfKy?>W=Zso!9T&HzrCaJ;Crjg-R91Mhy@4zB{Q_Q7JrUY&YZSt zF~I2*3G3=YWG;88r2wT8Gzq)0BP*ONEr&Fnqaw5L|D2{qDxON5z4e zZD@&pQpe!>@c72M2gQLNZC1fWxaeM{DP-Q2Oa?Hi)84TtjFIsOV}G5Cb(z_o7bA7P zHzs3H+cJA3eow=itTxjl~poIZZRJWed(kxdE5 zrw|1sDD0XOX?q4zDM`MTXuAT#-Hiz z0WK_~!kL_&G8gkf;Y=)sSQ~Ci<%{j*&v*>b@eG+wCcl!&(^#*FIxCMuZ;K-q`Afg7 zYO7OcOmMzLhSr>_t~t8zvyy^_Apeq}nzO`%q{VP^r%aHn=6@+G3O7rO!DvP$NS5++ zubuU;m)mMzICr+~F@sp6f^PN{kAE<7O$yuS?z!c)-V#5Yz9IKYn(6&!N*LRmBK*Ym zjbs0*8|B_{L~r4AlcyUH%#CsEt{t1Bx6~dWh=;<)je22aT=sL)1FFS$ z?q)0pP7RI~FC9Bb?klal(aIaC3``DEDSw`F`m@;mz#n|<1_J4vvxdi|zy*}Ek}m(H z2tLmO{ewJ(&%f~I{P>OsjTAgTBQqmU{1bg?O|C?~@qd7HNP!%6moCZ@{dXy%HfwYK zKky^OBx$F1x~Tn?T{Bx_GRgFtFn`B`DM^1vDe0P46!XV4?2@>V3r|H12B3Iy+?`Ex zDY8SYo*OuHS!%XlM&63wRyA>P92X|bOs*R*Ej^}5$6kG zxk6t~?Gc*GVbhzi84#NRu~CT42(jrA8~M(WppqP+7UH((SWffi z_-^thq$HGnU`cw!1`!*DSWuFzsB(^%1Fg}$_3$)mK#6Rez>rRV`01=uLS zMguko2rt7hW{AJX_}NMPEuavTdRQq2!sh#?CxjP61UFDnPBA6AevVpU0$i-zbo zlV7yp0fm^WhS{&QH-mP#>H0BX_BshL`hTnxX0FoPfZohdbI;@5!<-E<_aUPJiHy!0 z9}8aE<1TQt@?rgx=;{cU0#)xm4r;uL^}_CVf!F<6pI2+W@?#}_cj*7w|E_Smzl?tG zhj7D#(mq9fVMn~c|9-^HKe`SMKSyfOW*lf!#hZ03-t!}by|cdNJe<=bPIvAv8h;xE zhXnea1fSGt7`I04k;}=c$(Y}xST7qcghvTqMgE9I8ss3f(RN)9Bg%hmK5Ai~ z!o745u^@Kn%lCc|SX024i7moHilHra@@r)Gcfb7h{`39Yy9gwrPg23BDA$WMd_#<3 zny9OyH?QBG3nFibdgTc=r{-puA%Awv^r~j9W(F+X?B#odoWk47=p-ihxk-$R7?P-YB_uKupjXIxSw#WwEf69-0=0k=6{%-tCwiFJxv8m)pUarn< z{VRy*^IERi-hJ9QaUy!$?w*IV2cbX!oFpHf0n>V`O+vYb^(lU=`y>O|y!maHgv85E~~Mk%YR z;BNsdlI^p)U2U0^3j6Cf{}pVm4m9Li2_q}x^-;v0u-p7;YJUgMp9rZoqOdAh#8HLS zb(!p%nw!<4R8;)JJdH5Ou$a}%gP#{+$?{las8f^z5?P-dRl1B(^nK1 z_C0@QWo)yulz&ogkZUEZH_HOE*+Pq7ROZQ3vZ>RR+NQ--TQemBc~ zRq;%ysdaJI)ipCV0NLJnGBoXuU5#o=Y+BXQC)G7do{1zIC!3O~m9pt}iR|okiZ~J_ z*YyB4Hm|L5|CbSr9QtO^=#G8Wh**_ zK&DmK`zDv!&C>8M_7cLq>ks{{-`ES$eLAa53xF$8S7}!vQ}ucUFj)mH+>#%XsxDpnZnRAW>67=GS4)GOq37x#RXp9*4)|aO71TK0%>tdmvrLcmvTF z!rd^57k^<=!D7jYO3rFgE`p8nYBr@{WyRM>TPNxDQhrJL{r~(KD8Zy(EYr{*d$|z*T6#Nu1Y0)=JSD7&1w!-?!}7GnwMFUuUe#_ zCgs&$l-b(MWaUzNhWh4e#vXl|D-?(JJMvH|ihnWzM>1@U95vN_?$apC=C_jR7jcvF z;3p}rZg1bHn;S~!`e*SnZQfcnh&yH~^Xd3d_d2Pwae0le!DbUdvce_8$26 zhUXEVnTSq(VLHy3B}wT97eqP?8rPA4C!FM!E?$#vT%QVRzRf{(Uy3aJtAcLFPM>im z0Jzk=2=^(BUU(1jx5G4d>7Z_Y@J3C;vwt?~9ogJGuf@z9|HfbH+3go9FK)IJWKnDN zt!XWoQPHLD!dl)k7F6*a^xj52(TzR}$Sy3wjIl>G?$m8`M$w%?659HgOXuffa<5H9 zaghCvN$E%4&o`w=aDS`L zhh4fS_*(^0FtgPdcmc~8(N|E3;b&^)s=&TjF3#NsnsZ(XSxV|wC_FeRJ6+$we|M>< zeR5=|cO9`b-LdHL!Zo@OutW0^D(jrsJKbyOPC<#QLjDAm-rEfP&oAF9_Qb=dB<2DV zk1MQU)a;T--3luxqjHXFF7q7pL_q%}$q(axv4=X8pAck1Z01;@?qhCwx@}N;P`fL!(pl(4 z)Ym?XmUV-(BgR<4oRs4Qv72^KJ0ct^pEJTz(X5;%!?IW{NR88`ZAX@7UzV4)c2l=A z#n8^!lq=}}raWA!q_?y+b6B@4-BsPtzS(q5`#~KL_Fe2gt(bWe`+u?)(zuCzHmKb$ zv&^&=j52RgpF=X&dQX(0@_La>CEWs=c4)O@wvDA9Y#aO$aZjUuaEaL-@q;a1HSoPj zMH8!;u0ctgjBeXVO@mxT+p#)2YUc`_F;U7Hcm)`D<3!#QE2~8`A*Tj#qF@mQ_l5G1 zXGMJqSy_@(K)$r<$bU*6hZ)aAxrmq4yj++-uqY1YO6_V^J(pk?PSvbH98?iwk9(u3 z_)h(Hmv{};@{OSf?t*rB=~E|L7JN7m=`<-H0^hX20NylTE@(KBlFuUYLQ4`}kgi`x(h8dSM(vnDI8D_v`$9G1YJ;W51&W-rTHzAoKHMkr9crRh5sI8vK-vAxbWCqb{ z_(yz(kWt|);k5{J>~oMELjM>C6jPKn_HW3p9l)z}*_lNO!hLG}qlO%V=-5T{PF-F7r@vwpk?B-70hMbhcF_)@+sPv+2jZ9;d)) z2hpSj{j2R=MW-h1=2Y_m$1P&bU~W#_W0YI;+JAAt90R5>iwVOrX`XeST_#Dahgtgh z&H2sm6zO4(VPbTC+k3(EF~~5bI^Uv8sE0}BDbv|TkysD2Ow%m0jUu3aCTVAAmY6h! z`kA!4x4dL}7-XK;nC~koti`O>SyF34bNu9h;})@YB4$qPQy6JNx1GeiZfM!j|CFP`Nv7z*P&2Wwl@~?G+4Mr8KMEHIRerru!1R zUItvUSIG(Q#S+8TC7W9}+2J{z?qP-3bborQgC|PJljd+DI0Xf*3-`BYLNb}*I^*sU zyKTmO9J6)e-8W{#{C6wnGym=pyM6w>+qgV?n$O1?=lQ*^<>DP@1?N1oId<3wKx;gt-m-uE^pBvbe>{)mA1WiEubpmm=M^8rwHX{5LSE{ldpEs_vs7!EOF@H9iS@DmFMHJ2-#U zp;zqBub!y&M^Xi!@hEMU$3b^)_0{>5tEpCd_EjJcFRQMov%@qh=d;Cvn}1&P5;Hj4 zOamI8eufF|#V=v<1uYFmy}Z>b1;69fRev_lRHqe2DLhf9%W|cm%G^|?Ev-Rc6t4`g zVrrBx-q;MrFKAxr-?7vXFMtm^9+?lL7vGH8(N|LqqOZk4`!1AH)@fP9r;FTL_32`G z&~|)j>S%M4mO0+S6nutD4S$bXWzu5FC8=QOZ0JZPi#S^Tbg?IBn@E~k%ad7kEcxp; zkP{zbe@5(*g2yZkpIM3HMk#!*t(=F0$00(YIfSV>X}Niv`%i6pLESSZ)hFi7(1l;w3| z#kFEss#M4Xd+SJhdw<5grFeLnIJn0! zjVyog^3lqZQV5d)k~H!j23GGlf}gt}$rI0M*Nz)#N(xviK!1~7TtF`^=S7DpIeQe1 zwcNF0fNDb&44hYuGYJ8PX7$pRfOgBx{8vqe=w@v>r-7!p;8f`Nm2 zjE)TBvbEGh(SL35esD#C`Cc8mV}Z6}0Bl1v3>sZLO3z-4hoT6@CjOngBEcem)yd_)5 zeNr8<4-MsXcd}4MvfJQ;x`ZMLmn1u7hcIG=L;raw3S_u~*0a#{qW2|-ft}S{B?UMY zph@Czu-55T3Q01cAyxHmGFfDjlQb2icn6lUmxS4ha3{76KDHqeCW@mql}ZRe@-K-g z*;7(mhkpy57@*n^1v|3*kXh5$N^OH*RDdQmIi5Uy6ivmgyn!rIbwNG!fQh-qbl2kU<$|7Zef`3Rx1IgYuFpiYpuC%~L!a#-V;6nogPq~0VXr!!y zUVrp~)!g=M2a?<16J9`b4HqO8oI;p3hXbzNSg-?8;KEh#NnKIk4E_`04xEk!dltl% z6bQrkN|3f@NuDtD(&0g*dmDBnjI+w^HF%tKPvQkM&Of023rqY?gf%}dF7A&$mv|bKaRex|NgA@(-Sq=I6T*%Ce$-UeS#oS-Z@6`awG-P04{eBqC1sf67lu+{1r9_3nv~#`)D;PSOzhKoN(f-`FNpzXUs~tS zTPXmk07=3n?l8%pSZwcDjfLCw@qggg_F9jBwhnZ9xeod#J=Ce-|M1{a5C@XL#G%$l zZ9%LW=oZ?W-cAg7ZHR`ICGHWi!ju@oREUDrJkPDqSqW`}Z}KmVsY?e;T`EkiDJ*po zg*AhJf`@;%C2%YZ*dz+RG59BV@b~vL9(-?+*z4R`5V7E(?-EUYtKmB4%ztWYD+ahW zM8cXf6N$|owo-sn0h)x(*pX#cRx5|JHc0WBBFv#v^=vD_z1%kVy$HTQ2ke@`ej=6Rj~F0cD52Y76z_7PNqGPsWRd#XLdCNS0-w+<8Dw8?3obOBa6gk=3*q< zf$tLSoW*nU12=1kefTVF&41!Zb{qUDFN3f9;7>s|jUW|=Kh%N57V=qgi?lfSkG!C$ zCstODBaxx#HuzsWK;1C@_`zOYtdrGBXbbk?->b{b9$J016$IDY-oC%G?oqK|CL3CU zpVc+EKD@p%?m@Aj2b)!J5iYowVG5ZxIg=fj*lO=k6voJSg?*iib$^-3o);~3x;G}c zQ8$7cb>qrqo1`(O*Jdtf&SP8`Q+3OW@`#u)=8VpIr>fkMo(>M96{FnB_jP8T>T8jHou7* zL8)$8Ufa|`1d2~ylYjb0mhREL@R}WMprI_zoTq#AMR-M{g|Yb^NdZn=wz{1NPJj!; zsBj|JPMM48pl~77QHQwSmZC=vZ|>} zoiX0=5)m3>Dw^tOf6ht@DuVn=f=bRJ2U07Bn>%HIWL3{emVenkFsOwmv4%*C?QwJ%z&`v|OFSHn@GMdD(7>?{8m`dnNVsZZjo}ZB7AxV*ARn z|J07M?>M5jaN5b^4Wzi6WWSgBe9=R&Y!da1>b$vh9B1&*-q%FFFU1d@L%-vZ+hZIE z%T-~xfIiA2*MG2U_LA74CNv%!Sg#Z6Y|JE(OIi=CGx}r(tja&a@140NK5eFxd`f{PWk`9 zkI*NH8@1C#?XPUA$r_VRrrU)1J6?=Q?RS)-rm96YeNDqGi5t1_R={8YiZ_SN**F$_ z#N$su>teZ(R4?b86`zy(h|h8yL6#g!^8I?Y7DFj4oTIz!(jn`l$7TBY)~}c+^JVkbl405l@FWXM`b#?oRa)D$ppSD$ely zi;0W`Njqh>bkr#49C7D22ESJCw7^DISGh`J{x>_e@EL*dSt~ z5PvgLl4M27F+0$j);aVqzj~y|#PLko5VcXLO^2G1LizjmhQ(!5;5Yb0%u}C~QTm=K zlE3$ejYQZ}GU>^MefK{69^w}w@i#+4rX4{_-JFh&uu+6fPuP6lbOirosQxW>Z|9|h z)b~rs8L=oO%Dq8HHIW~m;2w#Xs`}Zlw0}3fw!i7^8@udn>xYRm5T+h?X6}wDfwRgNi=1Et9Gho9CiqtlJ&~2Ylg@ArM<6~W#xB8 z+@8??v+r8qvVI->-i@~UcbZ+2`pQmhhVS}>`*hke*#8`;^_5{Kl}g^EVR4?yAb;$g zv^D3UP&-<)$NtKG)!&^yi1Z0l(9hwiLGw4ZYf>1t{Co4M6?RG7YkS)nPPR+mhhAVw z0$;}o`}y9!&^7W4TlcrWe);hA{^m9SiQuzTa7oH~PTAEL_j3_V5xjeQb54kSAnF(o zoEECC`dLrQ?4_LdY=@tQ_UQ5~9Dl3u_R@`edSA!rNXKn=zMekQ(HPR*(k^qRhjTQ< z=p@Y!&P1KgnHprhoCfDZqFtenJJYibMP(}L@c^a{&KE6$3%BUx U-&{PDTl@o$=Ha0J4-$Ml2eAEMEdT%j diff --git a/py-modindex/index.html b/py-modindex/index.html index 70f70563b..f12dbd4e9 100644 --- a/py-modindex/index.html +++ b/py-modindex/index.html @@ -219,8 +219,7 @@
      • Create a Custom Environment
      • Recording Agents
      • Speeding Up Training
      • -
      • Compatibility with Gym
      • -
      • Migration Guide - v0.21 to v1.0.0
      • +
      • Gym Migration Guide

      API

        @@ -300,6 +299,10 @@
    • Training Agents

      API

        @@ -299,6 +298,10 @@
    • Training Agents
        +
      • Action Masking in the Taxi Environment
      • +
      • Running the Experiment
      • +
      • Visualizing Results
      • +
      • Results Analysis
      • Solving Blackjack with Tabular Q-Learning
      • Solving Frozenlake with Tabular Q-Learning
      • Training using REINFORCE for Mujoco
      • diff --git a/searchindex.js b/searchindex.js index 494b0bba8..366354c04 100644 --- a/searchindex.js +++ b/searchindex.js @@ -1 +1 @@ -Search.setIndex({"alltitles": {"0.12.5": [[155, "release-0-12-5"]], "0.19.0": [[155, "release-0-19-0"]], "0.22.0": [[155, "release-0-22-0"]], "0.23.0": [[155, "release-0-23-0"]], "0.23.1": [[155, "release-0-23-1"]], "0.24.0": [[155, "release-0-24-0"]], "0.24.1": [[155, "release-0-24-1"]], "0.25.0": [[155, "release-0-25-0"]], "0.25.1": [[155, "release-0-25-1"]], "0.25.2": [[155, "release-0-25-2"]], "0.26.0": [[155, "release-0-26-0"]], "0.26.1": [[155, "release-0-26-1"]], "0.26.2": [[155, "release-0-26-2"]], "1. Package Name Change": [[161, "package-name-change"]], "2. Seeding and Random Number Generation": [[161, "seeding-and-random-number-generation"]], "3. Environment Reset Changes": [[161, "environment-reset-changes"]], "4. Step Function: The done \u2192 terminated/truncated Split": [[161, "step-function-the-done-terminated-truncated-split"]], "404 - Page Not Found": [[0, null]], "5. Render Mode Changes": [[161, "render-mode-changes"]], "About the Environment: Blackjack": [[164, "about-the-environment-blackjack"]], "Acrobot": [[131, null]], "Action Space": [[127, "action-space"], [128, "action-space"], [129, "action-space"], [131, "action-space"], [132, "action-space"], [133, "action-space"], [134, "action-space"], [135, "action-space"], [137, "action-space"], [138, "action-space"], [139, "action-space"], [140, "action-space"], [141, "action-space"], [142, "action-space"], [143, "action-space"], [144, "action-space"], [145, "action-space"], [146, "action-space"], [147, "action-space"], [150, "action-space"], [151, "action-space"], [152, "action-space"], [153, "action-space"], [154, "action-space"]], "Action Space Issues": [[159, "action-space-issues"]], "Action Wrappers": [[16, null]], "Action and observation spaces": [[158, "action-and-observation-spaces"]], "Adding Rendering": [[159, "adding-rendering"]], "Adding a new environment": [[1, "adding-a-new-environment"]], "Additional Methods": [[10, "additional-methods"], [11, "additional-methods"], [12, "additional-methods"]], "Additional functions": [[4, "additional-functions"]], "Advanced Environment Features": [[159, "advanced-environment-features"]], "Advantage Actor-Critic (A2C)": [[178, "advantage-actor-critic-a2c"]], "Adventure": [[22, null]], "AgileRL": [[172, "agilerl"]], "Air Raid": [[23, null]], "Algorithmic heuristics": [[163, "algorithmic-heuristics"]], "Alien": [[24, null]], "Alternative solutions": [[166, "alternative-solutions"]], "Amidar": [[25, null]], "Analyzing Training Results": [[164, "analyzing-training-results"]], "Ant": [[137, null]], "Arguments": [[127, "arguments"], [128, "arguments"], [129, "arguments"], [131, "arguments"], [132, "arguments"], [133, "arguments"], [134, "arguments"], [135, "arguments"], [137, "arguments"], [138, "arguments"], [139, "arguments"], [140, "arguments"], [141, "arguments"], [142, "arguments"], [143, "arguments"], [144, "arguments"], [145, "arguments"], [146, "arguments"], [147, "arguments"], [150, "arguments"], [151, "arguments"], [152, "arguments"], [153, "arguments"], [154, "arguments"]], "Assault": [[26, null]], "Asterix": [[27, null]], "Asteroids": [[28, null]], "AsyncVectorEnv": [[11, null]], "Atari": [[21, null]], "Atlantis": [[29, null]], "Atlantis2": [[30, null]], "Attributes": [[2, "attributes"], [5, "attributes"], [10, "attributes"], [15, "attributes"]], "Autonomous Driving environments": [[148, "autonomous-driving-environments"], [148, "id2"]], "Available Action Wrappers": [[16, "available-action-wrappers"]], "Backgammon": [[31, null]], "Bank Heist": [[32, null]], "Base Class": [[16, "base-class"]], "Basic Math": [[33, null]], "Basic Usage": [[158, null]], "Battle Zone": [[34, null]], "Beam Rider": [[35, null]], "Before You Code: Environment Design": [[159, "before-you-code-environment-design"]], "Berzerk": [[36, null]], "Best Practices Summary": [[162, "best-practices-summary"]], "Biological / Medical environments": [[148, "biological-medical-environments"]], "Bipedal Walker": [[127, null]], "Blackjack": [[37, null], [150, null]], "Boundary Handling Errors": [[159, "boundary-handling-errors"]], "Bowling": [[38, null]], "Box2D": [[126, null]], "Boxing": [[39, null]], "Breakout": [[40, null]], "Build the Documentation": [[1, "build-the-documentation"]], "Building a Q-Learning Agent": [[164, "building-a-q-learning-agent"]], "Building an agent": [[174, "building-an-agent"], [177, "building-an-agent"]], "Car Racing": [[128, null]], "Carnival": [[41, null]], "Cart Pole": [[132, null]], "Casino": [[42, null]], "Centipede": [[43, null]], "Check Environment Validity": [[159, "check-environment-validity"]], "Chopper Command": [[44, null]], "Classic Control": [[130, null]], "Cliff Walking": [[151, null]], "Cliff Walking Slippery": [[152, null]], "Close": [[166, "close"]], "Common Debug Issues": [[159, "common-debug-issues"]], "Common Environment Design Pitfalls": [[159, "common-environment-design-pitfalls"]], "Common Issues for Beginners": [[158, "common-issues-for-beginners"]], "Common Training Issues and Solutions": [[164, "common-training-issues-and-solutions"]], "Common Wrappers": [[17, "common-wrappers"]], "Comparing training performance across versions": [[136, "comparing-training-performance-across-versions"]], "Compatibility Helpers": [[161, "compatibility-helpers"]], "Compatibility with Gym": [[160, null]], "Composite Spaces": [[5, "composite-spaces"], [6, null]], "Constructing Observations": [[159, "constructing-observations"]], "Constructing Observations From Environment States": [[166, "constructing-observations-from-environment-states"]], "Converting Jax-based Functional environments to standard Env": [[3, "converting-jax-based-functional-environments-to-standard-env"]], "Core variables": [[4, "core-variables"]], "Crazy Climber": [[45, null]], "Create a Custom Environment": [[159, null]], "Creating Environment Instances": [[166, "creating-environment-instances"]], "Creating a Package": [[166, "creating-a-package"]], "Creating environments": [[2, "creating-environments"]], "Creating the Q-table": [[175, "creating-the-q-table"]], "Credits": [[127, "credits"], [128, "credits"], [129, "credits"]], "Crossbow": [[46, null]], "Darkchambers": [[47, null]], "Data Conversion Wrappers": [[17, "data-conversion-wrappers"]], "Debugging Your Environment": [[159, "debugging-your-environment"]], "Declaration and Initialization": [[166, "declaration-and-initialization"]], "Deep RL Framework Migration": [[161, "deep-rl-framework-migration"]], "Defender": [[48, null]], "Demon Attack": [[49, null]], "Description": [[127, "description"], [128, "description"], [129, "description"], [131, "description"], [132, "description"], [133, "description"], [134, "description"], [135, "description"], [137, "description"], [138, "description"], [139, "description"], [140, "description"], [141, "description"], [142, "description"], [143, "description"], [144, "description"], [145, "description"], [146, "description"], [147, "description"], [150, "description"], [151, "description"], [152, "description"], [153, "description"], [154, "description"]], "Design for Learning": [[159, "design-for-learning"]], "Domain Randomization": [[178, "domain-randomization"]], "Donkey Kong": [[50, null]], "Double Dunk": [[51, null]], "Earthworld": [[52, null]], "Economic / Financial environments": [[148, "economic-financial-environments"]], "Editing an environment page": [[1, "editing-an-environment-page"]], "Electrical / Energy environments": [[148, "electrical-energy-environments"]], "Elevator Action": [[53, null]], "Enduro": [[54, null]], "Entombed": [[55, null]], "Env": [[2, null]], "Environment Checking": [[9, "environment-checking"]], "Environment __init__": [[159, "environment-init"]], "Environment pickling": [[9, "environment-pickling"]], "Environment-Specific Changes": [[161, "environment-specific-changes"]], "Epilogue": [[170, "epilogue"]], "Episode End": [[131, "episode-end"], [132, "episode-end"], [133, "episode-end"], [134, "episode-end"], [137, "episode-end"], [138, "episode-end"], [139, "episode-end"], [140, "episode-end"], [141, "episode-end"], [142, "episode-end"], [143, "episode-end"], [144, "episode-end"], [145, "episode-end"], [146, "episode-end"], [147, "episode-end"], [150, "episode-end"], [151, "episode-end"], [152, "episode-end"], [153, "episode-end"], [154, "episode-end"]], "Episode Termination": [[127, "episode-termination"], [128, "episode-termination"], [129, "episode-termination"]], "Episode Truncation": [[135, "episode-truncation"]], "Et": [[56, null]], "Exact reproducibility": [[136, "exact-reproducibility"]], "Executing an action": [[164, "executing-an-action"], [174, "executing-an-action"]], "Explaining the Code Step by Step": [[158, "explaining-the-code-step-by-step"]], "Exploration vs Exploitation": [[164, "exploration-vs-exploitation"]], "External Environments": [[148, null]], "First-Party Environments": [[148, "first-party-environments"]], "Fishing Derby": [[57, null]], "Flag Capture": [[58, null]], "Freeway": [[59, null]], "Frogger": [[60, null]], "Frostbite": [[61, null]], "Frozen Lake": [[153, null]], "Functional Env": [[3, null]], "Fundamental Spaces": [[5, "fundamental-spaces"], [7, null]], "Galaxian": [[62, null]], "Game environments": [[148, "game-environments"]], "Generate your environment": [[166, "generate-your-environment"]], "Getting Help": [[161, "getting-help"]], "Gopher": [[63, null]], "Gravitar": [[64, null]], "GridWorld Example Design": [[159, "gridworld-example-design"]], "Gym Release Notes": [[155, null]], "Gym v0.21 Environment Compatibility": [[160, "gym-v0-21-environment-compatibility"]], "Gymnasium Basics": [[165, null], [169, null], [171, "gymnasium-basics"]], "Gymnasium Release Notes": [[156, null]], "Gymnasium v1.1.1": [[156, "release-v1-1-1"]], "Gymnasium-docs": [[1, null]], "Gymnasium.vector.VectorEnv": [[10, "gymnasium-vector-vectorenv"]], "Half Cheetah": [[138, null]], "Handling Time Limits": [[167, null]], "Hangman": [[65, null]], "Haunted House": [[66, null]], "Hero": [[67, null]], "Hopper": [[139, null]], "Human Cannonball": [[68, null]], "Humanoid": [[140, null]], "Humanoid Standup": [[141, null]], "Ice Hockey": [[69, null]], "Implemented Action wrappers": [[14, "implemented-action-wrappers"]], "Implemented Data Conversion wrappers": [[14, "implemented-data-conversion-wrappers"]], "Implemented Observation wrappers": [[14, "implemented-observation-wrappers"]], "Implemented Reward wrappers": [[14, "implemented-reward-wrappers"]], "Implemented Wrappers": [[18, "implemented-wrappers"], [19, "implemented-wrappers"]], "Implementing Custom Wrappers": [[168, null]], "Implementing environments": [[2, "implementing-environments"]], "Importance in learning code": [[167, "importance-in-learning-code"]], "Imports and Environment Setup": [[174, "imports-and-environment-setup"]], "Information": [[150, "information"], [151, "information"], [152, "information"], [153, "information"], [154, "information"]], "Inheriting from gymnasium.ActionWrapper": [[168, "inheriting-from-gymnasium-actionwrapper"]], "Inheriting from gymnasium.ObservationWrapper": [[168, "inheriting-from-gymnasium-observationwrapper"]], "Inheriting from gymnasium.RewardWrapper": [[168, "inheriting-from-gymnasium-rewardwrapper"]], "Inheriting from gymnasium.Wrapper": [[168, "inheriting-from-gymnasium-wrapper"]], "Initializing Environments": [[158, "initializing-environments"]], "Instructions for modifying environment pages": [[1, "instructions-for-modifying-environment-pages"]], "Integration with Experiment Tracking": [[162, "integration-with-experiment-tracking"]], "Interpreting the Results": [[164, "interpreting-the-results"]], "Introduction": [[178, "introduction"]], "Inverted Double Pendulum": [[142, null]], "Inverted Pendulum": [[143, null]], "Jamesbond": [[70, null]], "Johnny Code from Youtube": [[172, "johnny-code-from-youtube"]], "Journey Escape": [[71, null]], "Kaboom": [[72, null]], "Kangaroo": [[73, null]], "Key Changes Breakdown": [[161, "key-changes-breakdown"]], "Key Design Questions": [[159, "key-design-questions"]], "Keystone Kapers": [[74, null]], "King Kong": [[75, null]], "Klax": [[76, null]], "Koolaid": [[77, null]], "Krull": [[78, null]], "Kung Fu Master": [[79, null]], "Laser Gates": [[80, null]], "List of Wrappers": [[20, null]], "Load custom quadruped robot environments": [[170, null]], "Loading OpenAI Gym environments": [[160, "loading-openai-gym-environments"]], "Lost Luggage": [[81, null]], "Lunar Lander": [[129, null]], "Make and register": [[4, null]], "Make your own custom environment": [[166, null]], "Making Vector Environments": [[10, "making-vector-environments"]], "Manual Testing with Known Actions": [[159, "manual-testing-with-known-actions"]], "Map size: 11 \\times 11": [[175, "map-size-11-times-11"]], "Map size: 4 \\times 4": [[175, "map-size-4-times-4"]], "Map size: 7 \\times 7": [[175, "map-size-7-times-7"]], "Map size: 9 \\times 9": [[175, "map-size-9-times-9"]], "Mario Bros": [[82, null]], "Mathematics / Computational": [[148, "mathematics-computational"]], "Methods": [[2, "methods"], [5, "methods"], [10, "methods"], [15, "methods"]], "Migration Guide - v0.21 to v1.0.0": [[161, null]], "Miniature Golf": [[83, null]], "Misc Wrappers": [[17, null]], "Miscellaneous": [[13, "miscellaneous"]], "Modifying the environment": [[158, "modifying-the-environment"]], "Montezuma Revenge": [[84, null]], "More Information": [[162, "more-information"]], "Mountain Car": [[133, null]], "Mountain Car Continuous": [[134, null]], "Mr Do": [[85, null]], "Ms Pacman": [[86, null]], "MuJoCo": [[136, null]], "Name This Game": [[87, null]], "New v0.26+ Code (Including v1.0.0)": [[161, "new-v0-26-code-including-v1-0-0"]], "Next Steps": [[158, "next-steps"], [159, "next-steps"], [164, "next-steps"]], "Notes": [[129, "notes"], [146, "notes"]], "Notice": [[178, "notice"]], "Observation Space": [[127, "observation-space"], [128, "observation-space"], [129, "observation-space"], [131, "observation-space"], [132, "observation-space"], [133, "observation-space"], [134, "observation-space"], [135, "observation-space"], [137, "observation-space"], [138, "observation-space"], [139, "observation-space"], [140, "observation-space"], [141, "observation-space"], [142, "observation-space"], [143, "observation-space"], [144, "observation-space"], [145, "observation-space"], [146, "observation-space"], [147, "observation-space"], [150, "observation-space"], [151, "observation-space"], [152, "observation-space"], [153, "observation-space"], [154, "observation-space"]], "Observation Wrappers": [[18, null]], "Observing the environment": [[174, "observing-the-environment"]], "Old to New Step API Compatibility": [[9, "old-to-new-step-api-compatibility"]], "Old v0.21 Code": [[161, "old-v0-21-code"]], "Optimizing training": [[163, "optimizing-training"]], "Othello": [[88, null]], "Other": [[148, "other"]], "Other environments": [[148, "other-environments"]], "Other steps": [[1, "other-steps"]], "Pacman": [[89, null]], "Parameterized Environments": [[159, "parameterized-environments"]], "Parameters we\u2019ll use": [[175, "parameters-we-ll-use"]], "Pendulum": [[135, null]], "Performance Analysis of Synchronous and Asynchronous Vectorized Environments": [[178, "performance-analysis-of-synchronous-and-asynchronous-vectorized-environments"]], "Phoenix": [[90, null]], "Pitfall": [[91, null]], "Pitfall2": [[92, null]], "Plot learning curve": [[177, "plot-learning-curve"]], "Plotting": [[178, "plotting"]], "Policy Network": [[177, "policy-network"]], "Pong": [[93, null]], "Pooyan": [[94, null]], "Private Eye": [[95, null]], "Pusher": [[144, null]], "Q-Learning Update Migration": [[161, "q-learning-update-migration"]], "Qbert": [[96, null]], "Quick Reference: Complete Changes Table": [[161, "quick-reference-complete-changes-table"]], "Reacher": [[145, null]], "Real-World Environment Design Tips": [[159, "real-world-environment-design-tips"]], "Recommended solution": [[166, "recommended-solution"]], "Recording Agents": [[162, null]], "Recording During Training (Periodic)": [[162, "recording-during-training-periodic"]], "Recording Every Episode (Evaluation)": [[162, "recording-every-episode-evaluation"]], "References": [[128, "references"], [131, "references"], [150, "references"], [151, "references"], [152, "references"], [154, "references"], [175, "references"], [177, "references"], [178, "references"]], "Registering Envs": [[166, "registering-envs"]], "Registering and making the environment": [[159, "registering-and-making-the-environment"]], "Removed Environments": [[161, "removed-environments"]], "Rendering": [[166, "rendering"]], "Rendering Arguments": [[136, "rendering-arguments"]], "Rendering Backend": [[136, "rendering-backend"]], "Reset": [[166, "reset"]], "Reset Arguments": [[128, "reset-arguments"]], "Reset function": [[159, "reset-function"]], "Reward": [[134, "reward"], [151, "reward"], [152, "reward"]], "Reward Design Issues": [[159, "reward-design-issues"]], "Reward Wrappers": [[19, null]], "Reward:": [[133, "reward"]], "Rewards": [[127, "rewards"], [128, "rewards"], [129, "rewards"], [131, "rewards"], [132, "rewards"], [135, "rewards"], [137, "rewards"], [138, "rewards"], [139, "rewards"], [140, "rewards"], [141, "rewards"], [142, "rewards"], [143, "rewards"], [144, "rewards"], [145, "rewards"], [146, "rewards"], [147, "rewards"], [150, "rewards"], [153, "rewards"], [154, "rewards"]], "Riverraid": [[97, null]], "Road Runner": [[98, null]], "Robotank": [[99, null]], "Robotics environments": [[148, "robotics-environments"], [148, "id1"]], "Running the environment": [[175, "running-the-environment"]], "Runtime Performance benchmark": [[9, "runtime-performance-benchmark"]], "Save Rendering Videos": [[9, "save-rendering-videos"]], "Saving/ Loading Weights": [[178, "saving-loading-weights"]], "Seaquest": [[100, null]], "Seeding": [[9, "seeding"]], "Setup": [[166, "setup"], [170, "setup"], [178, "setup"]], "Shared Memory for a Space": [[13, "shared-memory-for-a-space"]], "Showcase the Agent": [[178, "showcase-the-agent"]], "Side-by-Side Code Comparison": [[161, "side-by-side-code-comparison"]], "Sir Lancelot": [[101, null]], "Skiing": [[102, null]], "Solaris": [[103, null]], "Solution": [[167, "solution"]], "Solving Blackjack with Tabular Q-Learning": [[174, null]], "Solving Frozenlake with Tabular Q-Learning": [[175, null]], "Space Invaders": [[104, null]], "Space War": [[105, null]], "Spaces": [[5, null]], "Spaces Utils": [[8, null]], "Speeding Up Training": [[163, null]], "Speeding up A2C Training with Vector Envs": [[178, null]], "Star Gunner": [[106, null]], "Start Simple, Add Complexity Gradually": [[159, "start-simple-add-complexity-gradually"]], "Starting State": [[127, "starting-state"], [128, "starting-state"], [129, "starting-state"], [131, "starting-state"], [132, "starting-state"], [133, "starting-state"], [134, "starting-state"], [135, "starting-state"], [137, "starting-state"], [138, "starting-state"], [139, "starting-state"], [140, "starting-state"], [141, "starting-state"], [142, "starting-state"], [143, "starting-state"], [144, "starting-state"], [145, "starting-state"], [146, "starting-state"], [147, "starting-state"], [150, "starting-state"], [151, "starting-state"], [152, "starting-state"], [153, "starting-state"], [154, "starting-state"]], "State Representation Problems": [[159, "state-representation-problems"]], "Step": [[166, "step"]], "Step 0.1 - Download a Robot Model": [[170, "step-0-1-download-a-robot-model"]], "Step 1 - Load the model": [[170, "step-1-load-the-model"]], "Step 2 - Tweaking the Environment Parameters": [[170, "step-2-tweaking-the-environment-parameters"]], "Step 2.1 - Tweaking the Environment Simulation Parameters": [[170, "step-2-1-tweaking-the-environment-simulation-parameters"]], "Step 2.2 - Tweaking the Environment Termination Parameters": [[170, "step-2-2-tweaking-the-environment-termination-parameters"]], "Step 2.3 - Tweaking the Environment Reward Parameters": [[170, "step-2-3-tweaking-the-environment-reward-parameters"]], "Step 2.4 - Tweaking the Environment Observation Parameters": [[170, "step-2-4-tweaking-the-environment-observation-parameters"]], "Step 3 - Train your Agent": [[170, "step-3-train-your-agent"]], "Step API Compatibility": [[160, "step-api-compatibility"]], "Step function": [[159, "step-function"]], "Subclassing gymnasium.Env": [[166, "subclassing-gymnasium-env"]], "Superman": [[107, null]], "Surround": [[108, null]], "Swimmer": [[146, null]], "SyncVectorEnv": [[12, null]], "Taxi": [[154, null]], "Telecommunication Systems environments": [[148, "telecommunication-systems-environments"]], "Tennis": [[109, null]], "Termination": [[137, "termination"], [138, "termination"], [139, "termination"], [140, "termination"], [141, "termination"], [142, "termination"], [143, "termination"], [144, "termination"], [145, "termination"], [146, "termination"], [147, "termination"], [167, "termination"]], "Testing Your Migration": [[161, "testing-your-migration"]], "Testing Your Trained Agent": [[164, "testing-your-trained-agent"]], "Tetris": [[110, null]], "The FrozenLake environment": [[175, "the-frozenlake-environment"]], "The Learning Process": [[164, "the-learning-process"]], "The Training Loop": [[164, "the-training-loop"]], "The requested page could not be found.": [[0, "the-requested-page-could-not-be-found"]], "Think About Your Research Question": [[159, "think-about-your-research-question"]], "Think you can do better?": [[174, "think-you-can-do-better"]], "Third-Party Environments using Gym": [[148, "third-party-environments-using-gym"]], "Third-Party Tutorials": [[172, null]], "Third-Party tutorials about gymnasium": [[172, "third-party-tutorials-about-gymnasium"]], "Third-Party tutorials about libraries that use gymnasium": [[172, "third-party-tutorials-about-libraries-that-use-gymnasium"]], "Third-party environments with Gymnasium": [[148, "third-party-environments-with-gymnasium"]], "Tic Tac Toe 3D": [[111, null]], "Time Pilot": [[112, null]], "TimeLimit Wrapper Changes": [[161, "timelimit-wrapper-changes"]], "Toy Text": [[149, null]], "Training Agents": [[171, "training-agents"], [173, null], [176, null]], "Training Recording Benefits": [[162, "training-recording-benefits"]], "Training an Agent": [[164, null]], "Training the A2C Agent": [[178, "training-the-a2c-agent"]], "Training the Agent": [[164, "training-the-agent"]], "Training using REINFORCE for Mujoco": [[177, null]], "Transition Dynamics:": [[133, "transition-dynamics"], [134, "transition-dynamics"]], "Trondead": [[113, null]], "Truncation": [[137, "truncation"], [138, "truncation"], [139, "truncation"], [140, "truncation"], [141, "truncation"], [142, "truncation"], [143, "truncation"], [144, "truncation"], [145, "truncation"], [146, "truncation"], [147, "truncation"], [167, "truncation"]], "Try playing the environment yourself": [[178, "try-playing-the-environment-yourself"]], "Turmoil": [[114, null]], "Tutankham": [[115, null]], "Tutorials": [[171, null]], "Uncommon Wrappers": [[17, "uncommon-wrappers"]], "Understanding Q-Learning Intuitively": [[164, "understanding-q-learning-intuitively"]], "Understanding the Agent-Environment Loop": [[158, "understanding-the-agent-environment-loop"]], "Understanding the Output": [[162, "understanding-the-output"]], "Understanding the Q-Learning Update": [[164, "understanding-the-q-learning-update"]], "Up N Down": [[116, null]], "Using Old Environments": [[161, "using-old-environments"]], "Using Vectorized Environments": [[178, "using-vectorized-environments"]], "Using Wrappers": [[159, "using-wrappers"], [166, "using-wrappers"]], "Utility functions": [[5, "utility-functions"], [9, null], [13, null]], "Vector Only wrappers": [[14, "vector-only-wrappers"]], "Vector Utility functions": [[5, "vector-utility-functions"]], "Vector only Wrappers": [[20, "vector-only-wrappers"]], "Vectorize": [[10, null]], "Vectorized Common wrappers": [[14, "vectorized-common-wrappers"]], "Vectorized environment": [[132, "vectorized-environment"]], "Vectorized environments": [[163, "vectorized-environments"]], "Vectorizing Spaces": [[13, "vectorizing-spaces"]], "Venture": [[117, null]], "Version History": [[127, "version-history"], [128, "version-history"], [129, "version-history"], [131, "version-history"], [132, "version-history"], [133, "version-history"], [134, "version-history"], [135, "version-history"], [137, "version-history"], [138, "version-history"], [139, "version-history"], [140, "version-history"], [141, "version-history"], [142, "version-history"], [143, "version-history"], [144, "version-history"], [145, "version-history"], [146, "version-history"], [147, "version-history"], [150, "version-history"], [151, "version-history"], [152, "version-history"], [153, "version-history"], [154, "version-history"]], "Versions": [[136, "versions"]], "Video Checkers": [[118, null]], "Video Chess": [[119, null]], "Video Cube": [[120, null]], "Video Game environments": [[148, "video-game-environments"]], "Video Pinball": [[121, null]], "Visualising the policy": [[174, "visualising-the-policy"]], "Visualization": [[9, "visualization"], [175, "visualization"]], "Visualizing the training": [[174, "visualizing-the-training"]], "Walker2D": [[147, null]], "What is Reinforcement Learning?": [[158, "what-is-reinforcement-learning"]], "What to Expect During Training": [[164, "what-to-expect-during-training"]], "When to Record": [[162, "when-to-record"]], "Who Should Read This Guide?": [[161, "who-should-read-this-guide"]], "Why Did the API Change?": [[161, "why-did-the-api-change"]], "Why Gymnasium?": [[158, "why-gymnasium"]], "Why Record Your Agent?": [[162, "why-record-your-agent"]], "Wizard Of Wor": [[122, null]], "Word Zapper": [[123, null]], "Wrappers": [[14, null], [15, null]], "Writing Tutorials": [[1, "writing-tutorials"]], "Yars Revenge": [[124, null]], "Your First RL Program": [[158, "your-first-rl-program"]], "Zaxxon": [[125, null]], "freeCodeCamp from Youtube": [[172, "freecodecamp-from-youtube"]], "v0.20.0": [[155, "release-v0-20-0"]], "v0.21.0": [[155, "release-v0-21-0"]], "v0.26.0: Initial Release": [[156, "release-v0-26-0"]], "v0.26.1": [[156, "release-v0-26-1"]], "v0.26.2 ": [[156, "release-v0-26-2"]], "v0.26.3": [[156, "release-v0-26-3"]], "v0.27.0": [[156, "release-v0-27-0"]], "v0.27.1": [[156, "release-v0-27-1"]], "v0.28.0": [[156, "release-v0-28-0"]], "v0.28.1": [[156, "release-v0-28-1"]], "v0.29.0": [[156, "release-v0-29-0"]], "v0.29.1 ": [[156, "release-v0-29-1"]], "v0.7.3": [[155, "release-v0-7-3"]], "v0.7.4": [[155, "release-v0-7-4"]], "v0.9.5": [[155, "release-v0-9-5"]], "v0.9.6": [[155, "release-v0-9-6"]], "v1.0.0": [[156, "release-v1-0-0"]], "v1.0.0a1: v1.0.0 alpha1 ": [[156, "release-v1-0-0a1"]], "v1.0.0a2: v1.0.0 alpha 2": [[156, "release-v1-0-0a2"]], "v1.1.0": [[156, "release-v1-1-0"]], "v1.2.0": [[156, "release-v1-2-0"]], "\ud83d\udea8 Agent Gets Stuck in Poor Strategy": [[164, "agent-gets-stuck-in-poor-strategy"]], "\ud83d\udea8 Agent Never Improves": [[164, "agent-never-improves"]], "\ud83d\udea8 Learning Too Slow": [[164, "learning-too-slow"]], "\ud83d\udea8 Unstable Training": [[164, "unstable-training"]]}, "docnames": ["404", "README", "api/env", "api/functional", "api/registry", "api/spaces", "api/spaces/composite", "api/spaces/fundamental", "api/spaces/utils", "api/utils", "api/vector", "api/vector/async_vector_env", "api/vector/sync_vector_env", "api/vector/utils", "api/vector/wrappers", "api/wrappers", "api/wrappers/action_wrappers", "api/wrappers/misc_wrappers", "api/wrappers/observation_wrappers", "api/wrappers/reward_wrappers", "api/wrappers/table", "environments/atari", "environments/atari/adventure", "environments/atari/air_raid", "environments/atari/alien", "environments/atari/amidar", "environments/atari/assault", "environments/atari/asterix", "environments/atari/asteroids", "environments/atari/atlantis", "environments/atari/atlantis2", "environments/atari/backgammon", "environments/atari/bank_heist", "environments/atari/basic_math", "environments/atari/battle_zone", "environments/atari/beam_rider", "environments/atari/berzerk", "environments/atari/blackjack", "environments/atari/bowling", "environments/atari/boxing", "environments/atari/breakout", "environments/atari/carnival", "environments/atari/casino", "environments/atari/centipede", "environments/atari/chopper_command", "environments/atari/crazy_climber", "environments/atari/crossbow", "environments/atari/darkchambers", "environments/atari/defender", "environments/atari/demon_attack", "environments/atari/donkey_kong", "environments/atari/double_dunk", "environments/atari/earthworld", "environments/atari/elevator_action", "environments/atari/enduro", "environments/atari/entombed", "environments/atari/et", "environments/atari/fishing_derby", "environments/atari/flag_capture", "environments/atari/freeway", "environments/atari/frogger", "environments/atari/frostbite", "environments/atari/galaxian", "environments/atari/gopher", "environments/atari/gravitar", "environments/atari/hangman", "environments/atari/haunted_house", "environments/atari/hero", "environments/atari/human_cannonball", "environments/atari/ice_hockey", "environments/atari/jamesbond", "environments/atari/journey_escape", "environments/atari/kaboom", "environments/atari/kangaroo", "environments/atari/keystone_kapers", "environments/atari/king_kong", "environments/atari/klax", "environments/atari/koolaid", "environments/atari/krull", "environments/atari/kung_fu_master", "environments/atari/laser_gates", "environments/atari/lost_luggage", "environments/atari/mario_bros", "environments/atari/miniature_golf", "environments/atari/montezuma_revenge", "environments/atari/mr_do", "environments/atari/ms_pacman", "environments/atari/name_this_game", "environments/atari/othello", "environments/atari/pacman", "environments/atari/phoenix", "environments/atari/pitfall", "environments/atari/pitfall2", "environments/atari/pong", "environments/atari/pooyan", "environments/atari/private_eye", "environments/atari/qbert", "environments/atari/riverraid", "environments/atari/road_runner", "environments/atari/robotank", "environments/atari/seaquest", "environments/atari/sir_lancelot", "environments/atari/skiing", "environments/atari/solaris", "environments/atari/space_invaders", "environments/atari/space_war", "environments/atari/star_gunner", "environments/atari/superman", "environments/atari/surround", "environments/atari/tennis", "environments/atari/tetris", "environments/atari/tic_tac_toe_3d", "environments/atari/time_pilot", "environments/atari/trondead", "environments/atari/turmoil", "environments/atari/tutankham", "environments/atari/up_n_down", "environments/atari/venture", "environments/atari/video_checkers", "environments/atari/video_chess", "environments/atari/video_cube", "environments/atari/video_pinball", "environments/atari/wizard_of_wor", "environments/atari/word_zapper", "environments/atari/yars_revenge", "environments/atari/zaxxon", "environments/box2d", "environments/box2d/bipedal_walker", "environments/box2d/car_racing", "environments/box2d/lunar_lander", "environments/classic_control", "environments/classic_control/acrobot", "environments/classic_control/cart_pole", "environments/classic_control/mountain_car", "environments/classic_control/mountain_car_continuous", "environments/classic_control/pendulum", "environments/mujoco", "environments/mujoco/ant", "environments/mujoco/half_cheetah", "environments/mujoco/hopper", "environments/mujoco/humanoid", "environments/mujoco/humanoid_standup", "environments/mujoco/inverted_double_pendulum", "environments/mujoco/inverted_pendulum", "environments/mujoco/pusher", "environments/mujoco/reacher", "environments/mujoco/swimmer", "environments/mujoco/walker2d", "environments/third_party_environments", "environments/toy_text", "environments/toy_text/blackjack", "environments/toy_text/cliff_walking", "environments/toy_text/cliff_walking_slippery", "environments/toy_text/frozen_lake", "environments/toy_text/taxi", "gym_release_notes/index", "gymnasium_release_notes/index", "index", "introduction/basic_usage", "introduction/create_custom_env", "introduction/gym_compatibility", "introduction/migration_guide", "introduction/record_agent", "introduction/speed_up_env", "introduction/train_agent", "tutorials/gymnasium_basics/README", "tutorials/gymnasium_basics/environment_creation", "tutorials/gymnasium_basics/handling_time_limits", "tutorials/gymnasium_basics/implementing_custom_wrappers", "tutorials/gymnasium_basics/index", "tutorials/gymnasium_basics/load_quadruped_model", "tutorials/index", "tutorials/third-party-tutorials", "tutorials/training_agents/README", "tutorials/training_agents/blackjack_q_learning", "tutorials/training_agents/frozenlake_q_learning", "tutorials/training_agents/index", "tutorials/training_agents/mujoco_reinforce", "tutorials/training_agents/vector_a2c"], "envversion": {"sphinx": 62, "sphinx.domains.c": 3, "sphinx.domains.changeset": 1, "sphinx.domains.citation": 1, "sphinx.domains.cpp": 9, "sphinx.domains.index": 1, "sphinx.domains.javascript": 3, "sphinx.domains.math": 2, "sphinx.domains.python": 4, "sphinx.domains.rst": 2, "sphinx.domains.std": 2, "sphinx.ext.viewcode": 1}, "filenames": ["404.md", "README.md", "api/env.md", "api/functional.md", "api/registry.md", "api/spaces.md", "api/spaces/composite.md", "api/spaces/fundamental.md", "api/spaces/utils.md", "api/utils.md", "api/vector.md", "api/vector/async_vector_env.md", "api/vector/sync_vector_env.md", "api/vector/utils.md", "api/vector/wrappers.md", "api/wrappers.md", "api/wrappers/action_wrappers.md", "api/wrappers/misc_wrappers.md", "api/wrappers/observation_wrappers.md", "api/wrappers/reward_wrappers.md", "api/wrappers/table.md", "environments/atari.md", "environments/atari/adventure.md", "environments/atari/air_raid.md", "environments/atari/alien.md", "environments/atari/amidar.md", "environments/atari/assault.md", "environments/atari/asterix.md", "environments/atari/asteroids.md", "environments/atari/atlantis.md", "environments/atari/atlantis2.md", "environments/atari/backgammon.md", "environments/atari/bank_heist.md", "environments/atari/basic_math.md", "environments/atari/battle_zone.md", "environments/atari/beam_rider.md", "environments/atari/berzerk.md", "environments/atari/blackjack.md", "environments/atari/bowling.md", "environments/atari/boxing.md", "environments/atari/breakout.md", "environments/atari/carnival.md", "environments/atari/casino.md", "environments/atari/centipede.md", "environments/atari/chopper_command.md", "environments/atari/crazy_climber.md", "environments/atari/crossbow.md", "environments/atari/darkchambers.md", "environments/atari/defender.md", "environments/atari/demon_attack.md", "environments/atari/donkey_kong.md", "environments/atari/double_dunk.md", "environments/atari/earthworld.md", "environments/atari/elevator_action.md", "environments/atari/enduro.md", "environments/atari/entombed.md", "environments/atari/et.md", "environments/atari/fishing_derby.md", "environments/atari/flag_capture.md", "environments/atari/freeway.md", "environments/atari/frogger.md", "environments/atari/frostbite.md", "environments/atari/galaxian.md", "environments/atari/gopher.md", "environments/atari/gravitar.md", "environments/atari/hangman.md", "environments/atari/haunted_house.md", "environments/atari/hero.md", "environments/atari/human_cannonball.md", "environments/atari/ice_hockey.md", "environments/atari/jamesbond.md", "environments/atari/journey_escape.md", "environments/atari/kaboom.md", "environments/atari/kangaroo.md", "environments/atari/keystone_kapers.md", "environments/atari/king_kong.md", "environments/atari/klax.md", "environments/atari/koolaid.md", "environments/atari/krull.md", "environments/atari/kung_fu_master.md", "environments/atari/laser_gates.md", "environments/atari/lost_luggage.md", "environments/atari/mario_bros.md", "environments/atari/miniature_golf.md", "environments/atari/montezuma_revenge.md", "environments/atari/mr_do.md", "environments/atari/ms_pacman.md", "environments/atari/name_this_game.md", "environments/atari/othello.md", "environments/atari/pacman.md", "environments/atari/phoenix.md", "environments/atari/pitfall.md", "environments/atari/pitfall2.md", "environments/atari/pong.md", "environments/atari/pooyan.md", "environments/atari/private_eye.md", "environments/atari/qbert.md", "environments/atari/riverraid.md", "environments/atari/road_runner.md", "environments/atari/robotank.md", "environments/atari/seaquest.md", "environments/atari/sir_lancelot.md", "environments/atari/skiing.md", "environments/atari/solaris.md", "environments/atari/space_invaders.md", "environments/atari/space_war.md", "environments/atari/star_gunner.md", "environments/atari/superman.md", "environments/atari/surround.md", "environments/atari/tennis.md", "environments/atari/tetris.md", "environments/atari/tic_tac_toe_3d.md", "environments/atari/time_pilot.md", "environments/atari/trondead.md", "environments/atari/turmoil.md", "environments/atari/tutankham.md", "environments/atari/up_n_down.md", "environments/atari/venture.md", "environments/atari/video_checkers.md", "environments/atari/video_chess.md", "environments/atari/video_cube.md", "environments/atari/video_pinball.md", "environments/atari/wizard_of_wor.md", "environments/atari/word_zapper.md", "environments/atari/yars_revenge.md", "environments/atari/zaxxon.md", "environments/box2d.md", "environments/box2d/bipedal_walker.md", "environments/box2d/car_racing.md", "environments/box2d/lunar_lander.md", "environments/classic_control.md", "environments/classic_control/acrobot.md", "environments/classic_control/cart_pole.md", "environments/classic_control/mountain_car.md", "environments/classic_control/mountain_car_continuous.md", "environments/classic_control/pendulum.md", "environments/mujoco.md", "environments/mujoco/ant.md", "environments/mujoco/half_cheetah.md", "environments/mujoco/hopper.md", "environments/mujoco/humanoid.md", "environments/mujoco/humanoid_standup.md", "environments/mujoco/inverted_double_pendulum.md", "environments/mujoco/inverted_pendulum.md", "environments/mujoco/pusher.md", "environments/mujoco/reacher.md", "environments/mujoco/swimmer.md", "environments/mujoco/walker2d.md", "environments/third_party_environments.md", "environments/toy_text.md", "environments/toy_text/blackjack.md", "environments/toy_text/cliff_walking.md", "environments/toy_text/cliff_walking_slippery.md", "environments/toy_text/frozen_lake.md", "environments/toy_text/taxi.md", "gym_release_notes/index.md", "gymnasium_release_notes/index.md", "index.md", "introduction/basic_usage.md", "introduction/create_custom_env.md", "introduction/gym_compatibility.md", "introduction/migration_guide.md", "introduction/record_agent.md", "introduction/speed_up_env.md", "introduction/train_agent.md", "tutorials/gymnasium_basics/README.rst", "tutorials/gymnasium_basics/environment_creation.rst", "tutorials/gymnasium_basics/handling_time_limits.rst", "tutorials/gymnasium_basics/implementing_custom_wrappers.rst", "tutorials/gymnasium_basics/index.rst", "tutorials/gymnasium_basics/load_quadruped_model.rst", "tutorials/index.rst", "tutorials/third-party-tutorials.md", "tutorials/training_agents/README.rst", "tutorials/training_agents/blackjack_q_learning.rst", "tutorials/training_agents/frozenlake_q_learning.rst", "tutorials/training_agents/index.rst", "tutorials/training_agents/mujoco_reinforce.rst", "tutorials/training_agents/vector_a2c.rst"], "indexentries": {"action() (gymnasium.actionwrapper method)": [[16, "gymnasium.ActionWrapper.action", false]], "action_space (gymnasium.env attribute)": [[2, "gymnasium.Env.action_space", false]], "action_space (gymnasium.vector.vectorenv attribute)": [[10, "gymnasium.vector.VectorEnv.action_space", false]], "action_space (gymnasium.wrapper property)": [[15, "gymnasium.Wrapper.action_space", false]], "actions() (gymnasium.vector.vectoractionwrapper method)": [[14, "gymnasium.vector.VectorActionWrapper.actions", false]], "actionwrapper (class in gymnasium)": [[16, "gymnasium.ActionWrapper", false]], "addrenderobservation (class in gymnasium.wrappers)": [[18, "gymnasium.wrappers.AddRenderObservation", false]], "arrayconversion (class in gymnasium.wrappers)": [[17, "gymnasium.wrappers.ArrayConversion", false]], "arrayconversion (class in gymnasium.wrappers.vector)": [[14, "gymnasium.wrappers.vector.ArrayConversion", false]], "asyncvectorenv (class in gymnasium.vector)": [[11, "gymnasium.vector.AsyncVectorEnv", false]], "ataripreprocessing (class in gymnasium.wrappers)": [[17, "gymnasium.wrappers.AtariPreprocessing", false]], "autoreset (class in gymnasium.wrappers)": [[17, "gymnasium.wrappers.Autoreset", false]], "batch_space() (in module gymnasium.vector.utils)": [[13, "gymnasium.vector.utils.batch_space", false]], "benchmark_init() (in module gymnasium.utils.performance)": [[9, "gymnasium.utils.performance.benchmark_init", false]], "benchmark_render() (in module gymnasium.utils.performance)": [[9, "gymnasium.utils.performance.benchmark_render", false]], "benchmark_step() (in module gymnasium.utils.performance)": [[9, "gymnasium.utils.performance.benchmark_step", false]], "box (class in gymnasium.spaces)": [[7, "gymnasium.spaces.Box", false]], "call() (gymnasium.vector.asyncvectorenv method)": [[11, "gymnasium.vector.AsyncVectorEnv.call", false]], "call() (gymnasium.vector.syncvectorenv method)": [[12, "gymnasium.vector.SyncVectorEnv.call", false]], "callback() (gymnasium.utils.play.playplot method)": [[9, "gymnasium.utils.play.PlayPlot.callback", false]], "capped_cubic_video_schedule() (in module gymnasium.utils.save_video)": [[9, "gymnasium.utils.save_video.capped_cubic_video_schedule", false]], "check_env() (in module gymnasium.utils.env_checker)": [[9, "gymnasium.utils.env_checker.check_env", false]], "clear_mpi_env_vars() (in module gymnasium.vector.utils)": [[13, "gymnasium.vector.utils.clear_mpi_env_vars", false]], "clipaction (class in gymnasium.wrappers)": [[16, "gymnasium.wrappers.ClipAction", false]], "clipaction (class in gymnasium.wrappers.vector)": [[14, "gymnasium.wrappers.vector.ClipAction", false]], "clipreward (class in gymnasium.wrappers)": [[19, "gymnasium.wrappers.ClipReward", false]], "clipreward (class in gymnasium.wrappers.vector)": [[14, "gymnasium.wrappers.vector.ClipReward", false]], "close() (gymnasium.env method)": [[2, "gymnasium.Env.close", false]], "close() (gymnasium.vector.asyncvectorenv method)": [[11, "gymnasium.vector.AsyncVectorEnv.close", false]], "close() (gymnasium.vector.syncvectorenv method)": [[12, "gymnasium.vector.SyncVectorEnv.close", false]], "close() (gymnasium.vector.vectorenv method)": [[10, "gymnasium.vector.VectorEnv.close", false]], "close() (gymnasium.vector.vectorwrapper method)": [[14, "gymnasium.vector.VectorWrapper.close", false]], "close() (gymnasium.wrapper method)": [[15, "gymnasium.Wrapper.close", false]], "closed (gymnasium.vector.vectorenv attribute)": [[10, "gymnasium.vector.VectorEnv.closed", false]], "cloudpicklewrapper() (in module gymnasium.vector.utils)": [[13, "gymnasium.vector.utils.CloudpickleWrapper", false]], "concatenate() (in module gymnasium.vector.utils)": [[13, "gymnasium.vector.utils.concatenate", false]], "contains() (gymnasium.spaces.space method)": [[5, "gymnasium.spaces.Space.contains", false]], "convert_to_done_step_api() (in module gymnasium.utils.step_api_compatibility)": [[9, "gymnasium.utils.step_api_compatibility.convert_to_done_step_api", false]], "convert_to_terminated_truncated_step_api() (in module gymnasium.utils.step_api_compatibility)": [[9, "gymnasium.utils.step_api_compatibility.convert_to_terminated_truncated_step_api", false]], "create_empty_array() (in module gymnasium.vector.utils)": [[13, "gymnasium.vector.utils.create_empty_array", false]], "create_shared_memory() (in module gymnasium.vector.utils)": [[13, "gymnasium.vector.utils.create_shared_memory", false]], "current_namespace (gymnasium.envs.registration attribute)": [[4, "gymnasium.envs.registration.current_namespace", false]], "delayobservation (class in gymnasium.wrappers)": [[18, "gymnasium.wrappers.DelayObservation", false]], "dict (class in gymnasium.spaces)": [[6, "gymnasium.spaces.Dict", false]], "dictinfotolist (class in gymnasium.wrappers.vector)": [[14, "gymnasium.wrappers.vector.DictInfoToList", false]], "discrete (class in gymnasium.spaces)": [[7, "gymnasium.spaces.Discrete", false]], "dtype (gymnasium.spaces.space property)": [[5, "gymnasium.spaces.Space.dtype", false]], "dtypeobservation (class in gymnasium.wrappers)": [[18, "gymnasium.wrappers.DtypeObservation", false]], "dtypeobservation (class in gymnasium.wrappers.vector)": [[14, "gymnasium.wrappers.vector.DtypeObservation", false]], "env (class in gymnasium)": [[2, "gymnasium.Env", false]], "env (gymnasium.wrapper attribute)": [[15, "gymnasium.Wrapper.env", false]], "envspec (class in gymnasium.envs.registration)": [[4, "gymnasium.envs.registration.EnvSpec", false]], "ezpickle (class in gymnasium.utils.ezpickle)": [[9, "gymnasium.utils.ezpickle.EzPickle", false]], "filterobservation (class in gymnasium.wrappers)": [[18, "gymnasium.wrappers.FilterObservation", false]], "filterobservation (class in gymnasium.wrappers.vector)": [[14, "gymnasium.wrappers.vector.FilterObservation", false]], "find_highest_version() (in module gymnasium.envs.registration)": [[4, "gymnasium.envs.registration.find_highest_version", false]], "flatdim() (in module gymnasium.spaces.utils)": [[8, "gymnasium.spaces.utils.flatdim", false]], "flatten() (in module gymnasium.spaces.utils)": [[8, "gymnasium.spaces.utils.flatten", false]], "flatten_space() (in module gymnasium.spaces.utils)": [[8, "gymnasium.spaces.utils.flatten_space", false]], "flattenobservation (class in gymnasium.wrappers)": [[18, "gymnasium.wrappers.FlattenObservation", false]], "flattenobservation (class in gymnasium.wrappers.vector)": [[14, "gymnasium.wrappers.vector.FlattenObservation", false]], "framestackobservation (class in gymnasium.wrappers)": [[18, "gymnasium.wrappers.FrameStackObservation", false]], "from_jsonable() (gymnasium.spaces.space method)": [[5, "gymnasium.spaces.Space.from_jsonable", false]], "funcenv (class in gymnasium.experimental.functional)": [[3, "gymnasium.experimental.functional.FuncEnv", false]], "functionaljaxenv (class in gymnasium.envs.functional_jax_env)": [[3, "gymnasium.envs.functional_jax_env.FunctionalJaxEnv", false]], "get_attr() (gymnasium.vector.asyncvectorenv method)": [[11, "gymnasium.vector.AsyncVectorEnv.get_attr", false]], "get_attr() (gymnasium.vector.syncvectorenv method)": [[12, "gymnasium.vector.SyncVectorEnv.get_attr", false]], "get_env_id() (in module gymnasium.envs.registration)": [[4, "gymnasium.envs.registration.get_env_id", false]], "get_wrapper_attr() (gymnasium.wrapper method)": [[15, "gymnasium.Wrapper.get_wrapper_attr", false]], "graph (class in gymnasium.spaces)": [[6, "gymnasium.spaces.Graph", false]], "grayscaleobservation (class in gymnasium.wrappers)": [[18, "gymnasium.wrappers.GrayscaleObservation", false]], "grayscaleobservation (class in gymnasium.wrappers.vector)": [[14, "gymnasium.wrappers.vector.GrayscaleObservation", false]], "gymnasium.spaces": [[5, "module-gymnasium.spaces", false]], "gymnasium.wrappers": [[15, "module-gymnasium.wrappers", false]], "humanrendering (class in gymnasium.wrappers)": [[17, "gymnasium.wrappers.HumanRendering", false]], "initial() (gymnasium.experimental.functional.funcenv method)": [[3, "gymnasium.experimental.functional.FuncEnv.initial", false]], "is_bounded() (gymnasium.spaces.box method)": [[7, "gymnasium.spaces.Box.is_bounded", false]], "is_np_flattenable (gymnasium.spaces.space property)": [[5, "gymnasium.spaces.Space.is_np_flattenable", false]], "iterate() (in module gymnasium.vector.utils)": [[13, "gymnasium.vector.utils.iterate", false]], "jaxtonumpy (class in gymnasium.wrappers)": [[17, "gymnasium.wrappers.JaxToNumpy", false]], "jaxtonumpy (class in gymnasium.wrappers.vector)": [[14, "gymnasium.wrappers.vector.JaxToNumpy", false]], "jaxtotorch (class in gymnasium.wrappers)": [[17, "gymnasium.wrappers.JaxToTorch", false]], "jaxtotorch (class in gymnasium.wrappers.vector)": [[14, "gymnasium.wrappers.vector.JaxToTorch", false]], "load_env_creator() (in module gymnasium.envs.registration)": [[4, "gymnasium.envs.registration.load_env_creator", false]], "make() (in module gymnasium)": [[4, "gymnasium.make", false]], "make_vec() (in module gymnasium)": [[4, "gymnasium.make_vec", false]], "maxandskipobservation (class in gymnasium.wrappers)": [[18, "gymnasium.wrappers.MaxAndSkipObservation", false]], "metadata (gymnasium.env attribute)": [[2, "gymnasium.Env.metadata", false]], "metadata (gymnasium.vector.vectorenv attribute)": [[10, "gymnasium.vector.VectorEnv.metadata", false]], "metadata (gymnasium.wrapper property)": [[15, "gymnasium.Wrapper.metadata", false]], "module": [[5, "module-gymnasium.spaces", false], [15, "module-gymnasium.wrappers", false]], "multibinary (class in gymnasium.spaces)": [[7, "gymnasium.spaces.MultiBinary", false]], "multidiscrete (class in gymnasium.spaces)": [[7, "gymnasium.spaces.MultiDiscrete", false]], "namespace() (in module gymnasium.envs.registration)": [[4, "gymnasium.envs.registration.namespace", false]], "normalizeobservation (class in gymnasium.wrappers)": [[18, "gymnasium.wrappers.NormalizeObservation", false]], "normalizeobservation (class in gymnasium.wrappers.vector)": [[14, "gymnasium.wrappers.vector.NormalizeObservation", false]], "normalizereward (class in gymnasium.wrappers)": [[19, "gymnasium.wrappers.NormalizeReward", false]], "normalizereward (class in gymnasium.wrappers.vector)": [[14, "gymnasium.wrappers.vector.NormalizeReward", false]], "np_random (gymnasium.env property)": [[2, "gymnasium.Env.np_random", false]], "np_random (gymnasium.spaces.space property)": [[5, "gymnasium.spaces.Space.np_random", false]], "np_random (gymnasium.vector.asyncvectorenv property)": [[11, "gymnasium.vector.AsyncVectorEnv.np_random", false]], "np_random (gymnasium.vector.syncvectorenv property)": [[12, "gymnasium.vector.SyncVectorEnv.np_random", false]], "np_random (gymnasium.vector.vectorenv property)": [[10, "gymnasium.vector.VectorEnv.np_random", false]], "np_random (gymnasium.wrapper property)": [[15, "gymnasium.Wrapper.np_random", false]], "np_random() (in module gymnasium.utils.seeding)": [[9, "gymnasium.utils.seeding.np_random", false]], "np_random_seed (gymnasium.env property)": [[2, "gymnasium.Env.np_random_seed", false]], "np_random_seed (gymnasium.vector.asyncvectorenv property)": [[11, "gymnasium.vector.AsyncVectorEnv.np_random_seed", false]], "np_random_seed (gymnasium.vector.syncvectorenv property)": [[12, "gymnasium.vector.SyncVectorEnv.np_random_seed", false]], "np_random_seed (gymnasium.vector.vectorenv property)": [[10, "gymnasium.vector.VectorEnv.np_random_seed", false]], "np_random_seed (gymnasium.wrapper property)": [[15, "gymnasium.Wrapper.np_random_seed", false]], "num_envs (gymnasium.vector.vectorenv attribute)": [[10, "gymnasium.vector.VectorEnv.num_envs", false]], "numpytotorch (class in gymnasium.wrappers)": [[17, "gymnasium.wrappers.NumpyToTorch", false]], "numpytotorch (class in gymnasium.wrappers.vector)": [[14, "gymnasium.wrappers.vector.NumpyToTorch", false]], "observation() (gymnasium.experimental.functional.funcenv method)": [[3, "gymnasium.experimental.functional.FuncEnv.observation", false]], "observation() (gymnasium.observationwrapper method)": [[18, "gymnasium.ObservationWrapper.observation", false]], "observation_space (gymnasium.env attribute)": [[2, "gymnasium.Env.observation_space", false]], "observation_space (gymnasium.vector.vectorenv attribute)": [[10, "gymnasium.vector.VectorEnv.observation_space", false]], "observation_space (gymnasium.wrapper property)": [[15, "gymnasium.Wrapper.observation_space", false]], "observations() (gymnasium.vector.vectorobservationwrapper method)": [[14, "gymnasium.vector.VectorObservationWrapper.observations", false]], "observationwrapper (class in gymnasium)": [[18, "gymnasium.ObservationWrapper", false]], "oneof (class in gymnasium.spaces)": [[6, "gymnasium.spaces.OneOf", false]], "orderenforcing (class in gymnasium.wrappers)": [[17, "gymnasium.wrappers.OrderEnforcing", false]], "parse_env_id() (in module gymnasium.envs.registration)": [[4, "gymnasium.envs.registration.parse_env_id", false]], "passiveenvchecker (class in gymnasium.wrappers)": [[17, "gymnasium.wrappers.PassiveEnvChecker", false]], "play() (in module gymnasium.utils.play)": [[9, "gymnasium.utils.play.play", false]], "playablegame (class in gymnasium.utils.play)": [[9, "gymnasium.utils.play.PlayableGame", false]], "playplot (class in gymnasium.utils.play)": [[9, "gymnasium.utils.play.PlayPlot", false]], "pprint_registry() (in module gymnasium)": [[4, "gymnasium.pprint_registry", false]], "process_event() (gymnasium.utils.play.playablegame method)": [[9, "gymnasium.utils.play.PlayableGame.process_event", false]], "read_from_shared_memory() (in module gymnasium.vector.utils)": [[13, "gymnasium.vector.utils.read_from_shared_memory", false]], "recordepisodestatistics (class in gymnasium.wrappers)": [[17, "gymnasium.wrappers.RecordEpisodeStatistics", false]], "recordepisodestatistics (class in gymnasium.wrappers.vector)": [[14, "gymnasium.wrappers.vector.RecordEpisodeStatistics", false]], "recordvideo (class in gymnasium.wrappers)": [[17, "gymnasium.wrappers.RecordVideo", false]], "register() (in module gymnasium)": [[4, "gymnasium.register", false]], "registry (gymnasium.envs.registration attribute)": [[4, "gymnasium.envs.registration.registry", false]], "render() (gymnasium.env method)": [[2, "gymnasium.Env.render", false]], "render() (gymnasium.envs.functional_jax_env.functionaljaxenv method)": [[3, "gymnasium.envs.functional_jax_env.FunctionalJaxEnv.render", false]], "render() (gymnasium.vector.vectorenv method)": [[10, "gymnasium.vector.VectorEnv.render", false]], "render() (gymnasium.vector.vectorwrapper method)": [[14, "gymnasium.vector.VectorWrapper.render", false]], "render() (gymnasium.wrapper method)": [[15, "gymnasium.Wrapper.render", false]], "render_close() (gymnasium.experimental.functional.funcenv method)": [[3, "gymnasium.experimental.functional.FuncEnv.render_close", false]], "render_image() (gymnasium.experimental.functional.funcenv method)": [[3, "gymnasium.experimental.functional.FuncEnv.render_image", false]], "render_init() (gymnasium.experimental.functional.funcenv method)": [[3, "gymnasium.experimental.functional.FuncEnv.render_init", false]], "render_mode (gymnasium.env attribute)": [[2, "gymnasium.Env.render_mode", false]], "render_mode (gymnasium.vector.vectorenv attribute)": [[10, "gymnasium.vector.VectorEnv.render_mode", false]], "rendercollection (class in gymnasium.wrappers)": [[17, "gymnasium.wrappers.RenderCollection", false]], "rescaleaction (class in gymnasium.wrappers)": [[16, "gymnasium.wrappers.RescaleAction", false]], "rescaleaction (class in gymnasium.wrappers.vector)": [[14, "gymnasium.wrappers.vector.RescaleAction", false]], "rescaleobservation (class in gymnasium.wrappers)": [[18, "gymnasium.wrappers.RescaleObservation", false]], "rescaleobservation (class in gymnasium.wrappers.vector)": [[14, "gymnasium.wrappers.vector.RescaleObservation", false]], "reset() (gymnasium.env method)": [[2, "gymnasium.Env.reset", false]], "reset() (gymnasium.envs.functional_jax_env.functionaljaxenv method)": [[3, "gymnasium.envs.functional_jax_env.FunctionalJaxEnv.reset", false]], "reset() (gymnasium.vector.asyncvectorenv method)": [[11, "gymnasium.vector.AsyncVectorEnv.reset", false]], "reset() (gymnasium.vector.syncvectorenv method)": [[12, "gymnasium.vector.SyncVectorEnv.reset", false]], "reset() (gymnasium.vector.vectorenv method)": [[10, "gymnasium.vector.VectorEnv.reset", false]], "reset() (gymnasium.vector.vectorwrapper method)": [[14, "gymnasium.vector.VectorWrapper.reset", false]], "reset() (gymnasium.wrapper method)": [[15, "gymnasium.Wrapper.reset", false]], "reshapeobservation (class in gymnasium.wrappers)": [[18, "gymnasium.wrappers.ReshapeObservation", false]], "reshapeobservation (class in gymnasium.wrappers.vector)": [[14, "gymnasium.wrappers.vector.ReshapeObservation", false]], "resizeobservation (class in gymnasium.wrappers)": [[18, "gymnasium.wrappers.ResizeObservation", false]], "resizeobservation (class in gymnasium.wrappers.vector)": [[14, "gymnasium.wrappers.vector.ResizeObservation", false]], "reward() (gymnasium.experimental.functional.funcenv method)": [[3, "gymnasium.experimental.functional.FuncEnv.reward", false]], "reward() (gymnasium.rewardwrapper method)": [[19, "gymnasium.RewardWrapper.reward", false]], "rewards() (gymnasium.vector.vectorrewardwrapper method)": [[14, "gymnasium.vector.VectorRewardWrapper.rewards", false]], "rewardwrapper (class in gymnasium)": [[19, "gymnasium.RewardWrapper", false]], "sample() (gymnasium.spaces.box method)": [[7, "gymnasium.spaces.Box.sample", false]], "sample() (gymnasium.spaces.dict method)": [[6, "gymnasium.spaces.Dict.sample", false]], "sample() (gymnasium.spaces.discrete method)": [[7, "gymnasium.spaces.Discrete.sample", false]], "sample() (gymnasium.spaces.graph method)": [[6, "gymnasium.spaces.Graph.sample", false]], "sample() (gymnasium.spaces.multibinary method)": [[7, "gymnasium.spaces.MultiBinary.sample", false]], "sample() (gymnasium.spaces.multidiscrete method)": [[7, "gymnasium.spaces.MultiDiscrete.sample", false]], "sample() (gymnasium.spaces.oneof method)": [[6, "gymnasium.spaces.OneOf.sample", false]], "sample() (gymnasium.spaces.sequence method)": [[6, "gymnasium.spaces.Sequence.sample", false]], "sample() (gymnasium.spaces.space method)": [[5, "gymnasium.spaces.Space.sample", false]], "sample() (gymnasium.spaces.text method)": [[7, "gymnasium.spaces.Text.sample", false]], "sample() (gymnasium.spaces.tuple method)": [[6, "gymnasium.spaces.Tuple.sample", false]], "save_video() (in module gymnasium.utils.save_video)": [[9, "gymnasium.utils.save_video.save_video", false]], "seed() (gymnasium.spaces.box method)": [[7, "gymnasium.spaces.Box.seed", false]], "seed() (gymnasium.spaces.dict method)": [[6, "gymnasium.spaces.Dict.seed", false]], "seed() (gymnasium.spaces.discrete method)": [[7, "gymnasium.spaces.Discrete.seed", false]], "seed() (gymnasium.spaces.graph method)": [[6, "gymnasium.spaces.Graph.seed", false]], "seed() (gymnasium.spaces.multibinary method)": [[7, "gymnasium.spaces.MultiBinary.seed", false]], "seed() (gymnasium.spaces.multidiscrete method)": [[7, "gymnasium.spaces.MultiDiscrete.seed", false]], "seed() (gymnasium.spaces.oneof method)": [[6, "gymnasium.spaces.OneOf.seed", false]], "seed() (gymnasium.spaces.sequence method)": [[6, "gymnasium.spaces.Sequence.seed", false]], "seed() (gymnasium.spaces.space method)": [[5, "gymnasium.spaces.Space.seed", false]], "seed() (gymnasium.spaces.text method)": [[7, "gymnasium.spaces.Text.seed", false]], "seed() (gymnasium.spaces.tuple method)": [[6, "gymnasium.spaces.Tuple.seed", false]], "sequence (class in gymnasium.spaces)": [[6, "gymnasium.spaces.Sequence", false]], "set_attr() (gymnasium.vector.asyncvectorenv method)": [[11, "gymnasium.vector.AsyncVectorEnv.set_attr", false]], "set_attr() (gymnasium.vector.syncvectorenv method)": [[12, "gymnasium.vector.SyncVectorEnv.set_attr", false]], "set_wrapper_attr() (gymnasium.wrapper method)": [[15, "gymnasium.Wrapper.set_wrapper_attr", false]], "shape (gymnasium.spaces.space property)": [[5, "gymnasium.spaces.Space.shape", false]], "single_action_space (gymnasium.vector.vectorenv attribute)": [[10, "gymnasium.vector.VectorEnv.single_action_space", false]], "single_observation_space (gymnasium.vector.vectorenv attribute)": [[10, "gymnasium.vector.VectorEnv.single_observation_space", false]], "space (class in gymnasium.spaces)": [[5, "gymnasium.spaces.Space", false]], "spec (gymnasium.env attribute)": [[2, "gymnasium.Env.spec", false]], "spec (gymnasium.vector.vectorenv attribute)": [[10, "gymnasium.vector.VectorEnv.spec", false]], "spec (gymnasium.wrapper property)": [[15, "gymnasium.Wrapper.spec", false]], "spec() (in module gymnasium)": [[4, "gymnasium.spec", false]], "state_info() (gymnasium.experimental.functional.funcenv method)": [[3, "gymnasium.experimental.functional.FuncEnv.state_info", false]], "step() (gymnasium.env method)": [[2, "gymnasium.Env.step", false]], "step() (gymnasium.envs.functional_jax_env.functionaljaxenv method)": [[3, "gymnasium.envs.functional_jax_env.FunctionalJaxEnv.step", false]], "step() (gymnasium.vector.asyncvectorenv method)": [[11, "gymnasium.vector.AsyncVectorEnv.step", false]], "step() (gymnasium.vector.syncvectorenv method)": [[12, "gymnasium.vector.SyncVectorEnv.step", false]], "step() (gymnasium.vector.vectorenv method)": [[10, "gymnasium.vector.VectorEnv.step", false]], "step() (gymnasium.vector.vectorwrapper method)": [[14, "gymnasium.vector.VectorWrapper.step", false]], "step() (gymnasium.wrapper method)": [[15, "gymnasium.Wrapper.step", false]], "step_api_compatibility() (in module gymnasium.utils.step_api_compatibility)": [[9, "gymnasium.utils.step_api_compatibility.step_api_compatibility", false]], "stickyaction (class in gymnasium.wrappers)": [[16, "gymnasium.wrappers.StickyAction", false]], "syncvectorenv (class in gymnasium.vector)": [[12, "gymnasium.vector.SyncVectorEnv", false]], "terminal() (gymnasium.experimental.functional.funcenv method)": [[3, "gymnasium.experimental.functional.FuncEnv.terminal", false]], "text (class in gymnasium.spaces)": [[7, "gymnasium.spaces.Text", false]], "timeawareobservation (class in gymnasium.wrappers)": [[18, "gymnasium.wrappers.TimeAwareObservation", false]], "timelimit (class in gymnasium.wrappers)": [[17, "gymnasium.wrappers.TimeLimit", false]], "to_jsonable() (gymnasium.spaces.space method)": [[5, "gymnasium.spaces.Space.to_jsonable", false]], "transform() (gymnasium.experimental.functional.funcenv method)": [[3, "gymnasium.experimental.functional.FuncEnv.transform", false]], "transformaction (class in gymnasium.wrappers)": [[16, "gymnasium.wrappers.TransformAction", false]], "transformaction (class in gymnasium.wrappers.vector)": [[14, "gymnasium.wrappers.vector.TransformAction", false]], "transformobservation (class in gymnasium.wrappers)": [[18, "gymnasium.wrappers.TransformObservation", false]], "transformobservation (class in gymnasium.wrappers.vector)": [[14, "gymnasium.wrappers.vector.TransformObservation", false]], "transformreward (class in gymnasium.wrappers)": [[19, "gymnasium.wrappers.TransformReward", false]], "transformreward (class in gymnasium.wrappers.vector)": [[14, "gymnasium.wrappers.vector.TransformReward", false]], "transition() (gymnasium.experimental.functional.funcenv method)": [[3, "gymnasium.experimental.functional.FuncEnv.transition", false]], "transition_info() (gymnasium.experimental.functional.funcenv method)": [[3, "gymnasium.experimental.functional.FuncEnv.transition_info", false]], "tuple (class in gymnasium.spaces)": [[6, "gymnasium.spaces.Tuple", false]], "unflatten() (in module gymnasium.spaces.utils)": [[8, "gymnasium.spaces.utils.unflatten", false]], "unwrapped (gymnasium.env property)": [[2, "gymnasium.Env.unwrapped", false]], "unwrapped (gymnasium.vector.vectorenv property)": [[10, "gymnasium.vector.VectorEnv.unwrapped", false]], "unwrapped (gymnasium.wrapper property)": [[15, "gymnasium.Wrapper.unwrapped", false]], "vectoractionwrapper (class in gymnasium.vector)": [[14, "gymnasium.vector.VectorActionWrapper", false]], "vectorenv (class in gymnasium.vector)": [[10, "gymnasium.vector.VectorEnv", false]], "vectorizetransformaction (class in gymnasium.wrappers.vector)": [[14, "gymnasium.wrappers.vector.VectorizeTransformAction", false]], "vectorizetransformobservation (class in gymnasium.wrappers.vector)": [[14, "gymnasium.wrappers.vector.VectorizeTransformObservation", false]], "vectorizetransformreward (class in gymnasium.wrappers.vector)": [[14, "gymnasium.wrappers.vector.VectorizeTransformReward", false]], "vectorobservationwrapper (class in gymnasium.vector)": [[14, "gymnasium.vector.VectorObservationWrapper", false]], "vectorrewardwrapper (class in gymnasium.vector)": [[14, "gymnasium.vector.VectorRewardWrapper", false]], "vectorwrapper (class in gymnasium.vector)": [[14, "gymnasium.vector.VectorWrapper", false]], "wrapper (class in gymnasium)": [[15, "gymnasium.Wrapper", false]], "wrapper_spec() (gymnasium.wrapper class method)": [[15, "gymnasium.Wrapper.wrapper_spec", false]], "wrapperspec (class in gymnasium.envs.registration)": [[4, "gymnasium.envs.registration.WrapperSpec", false]], "write_to_shared_memory() (in module gymnasium.vector.utils)": [[13, "gymnasium.vector.utils.write_to_shared_memory", false]]}, "objects": {"gymnasium": [[16, 0, 1, "", "ActionWrapper"], [2, 0, 1, "", "Env"], [18, 0, 1, "", "ObservationWrapper"], [19, 0, 1, "", "RewardWrapper"], [15, 0, 1, "", "Wrapper"], [4, 4, 1, "", "make"], [4, 4, 1, "", "make_vec"], [4, 4, 1, "", "pprint_registry"], [4, 4, 1, "", "register"], [5, 5, 0, "-", "spaces"], [4, 4, 1, "", "spec"], [15, 5, 0, "-", "wrappers"]], "gymnasium.ActionWrapper": [[16, 1, 1, "", "action"]], "gymnasium.Env": [[2, 2, 1, "", "action_space"], [2, 1, 1, "", "close"], [2, 2, 1, "", "metadata"], [2, 3, 1, "", "np_random"], [2, 3, 1, "", "np_random_seed"], [2, 2, 1, "", "observation_space"], [2, 1, 1, "", "render"], [2, 2, 1, "", "render_mode"], [2, 1, 1, "", "reset"], [2, 2, 1, "", "spec"], [2, 1, 1, "", "step"], [2, 3, 1, "", "unwrapped"]], "gymnasium.ObservationWrapper": [[18, 1, 1, "", "observation"]], "gymnasium.RewardWrapper": [[19, 1, 1, "", "reward"]], "gymnasium.Wrapper": [[15, 3, 1, "", "action_space"], [15, 1, 1, "", "close"], [15, 2, 1, "", "env"], [15, 1, 1, "", "get_wrapper_attr"], [15, 3, 1, "", "metadata"], [15, 3, 1, "", "np_random"], [15, 3, 1, "", "np_random_seed"], [15, 3, 1, "", "observation_space"], [15, 1, 1, "", "render"], [15, 1, 1, "", "reset"], [15, 1, 1, "", "set_wrapper_attr"], [15, 3, 1, "", "spec"], [15, 1, 1, "", "step"], [15, 3, 1, "", "unwrapped"], [15, 1, 1, "", "wrapper_spec"]], "gymnasium.envs.functional_jax_env": [[3, 0, 1, "", "FunctionalJaxEnv"]], "gymnasium.envs.functional_jax_env.FunctionalJaxEnv": [[3, 1, 1, "", "render"], [3, 1, 1, "", "reset"], [3, 1, 1, "", "step"]], "gymnasium.envs.registration": [[4, 0, 1, "", "EnvSpec"], [4, 0, 1, "", "WrapperSpec"], [4, 2, 1, "", "current_namespace"], [4, 4, 1, "", "find_highest_version"], [4, 4, 1, "", "get_env_id"], [4, 4, 1, "", "load_env_creator"], [4, 4, 1, "", "namespace"], [4, 4, 1, "", "parse_env_id"], [4, 2, 1, "", "registry"]], "gymnasium.experimental.functional": [[3, 0, 1, "", "FuncEnv"]], "gymnasium.experimental.functional.FuncEnv": [[3, 1, 1, "", "initial"], [3, 1, 1, "", "observation"], [3, 1, 1, "", "render_close"], [3, 1, 1, "", "render_image"], [3, 1, 1, "", "render_init"], [3, 1, 1, "", "reward"], [3, 1, 1, "", "state_info"], [3, 1, 1, "", "terminal"], [3, 1, 1, "", "transform"], [3, 1, 1, "", "transition"], [3, 1, 1, "", "transition_info"]], "gymnasium.spaces": [[7, 0, 1, "", "Box"], [6, 0, 1, "", "Dict"], [7, 0, 1, "", "Discrete"], [6, 0, 1, "", "Graph"], [7, 0, 1, "", "MultiBinary"], [7, 0, 1, "", "MultiDiscrete"], [6, 0, 1, "", "OneOf"], [6, 0, 1, "", "Sequence"], [5, 0, 1, "", "Space"], [7, 0, 1, "", "Text"], [6, 0, 1, "", "Tuple"]], "gymnasium.spaces.Box": [[7, 1, 1, "", "is_bounded"], [7, 1, 1, "", "sample"], [7, 1, 1, "", "seed"]], "gymnasium.spaces.Dict": [[6, 1, 1, "", "sample"], [6, 1, 1, "", "seed"]], "gymnasium.spaces.Discrete": [[7, 1, 1, "", "sample"], [7, 1, 1, "", "seed"]], "gymnasium.spaces.Graph": [[6, 1, 1, "", "sample"], [6, 1, 1, "", "seed"]], "gymnasium.spaces.MultiBinary": [[7, 1, 1, "", "sample"], [7, 1, 1, "", "seed"]], "gymnasium.spaces.MultiDiscrete": [[7, 1, 1, "", "sample"], [7, 1, 1, "", "seed"]], "gymnasium.spaces.OneOf": [[6, 1, 1, "", "sample"], [6, 1, 1, "", "seed"]], "gymnasium.spaces.Sequence": [[6, 1, 1, "", "sample"], [6, 1, 1, "", "seed"]], "gymnasium.spaces.Space": [[5, 1, 1, "", "contains"], [5, 3, 1, "", "dtype"], [5, 1, 1, "", "from_jsonable"], [5, 3, 1, "", "is_np_flattenable"], [5, 3, 1, "", "np_random"], [5, 1, 1, "", "sample"], [5, 1, 1, "", "seed"], [5, 3, 1, "", "shape"], [5, 1, 1, "", "to_jsonable"]], "gymnasium.spaces.Text": [[7, 1, 1, "", "sample"], [7, 1, 1, "", "seed"]], "gymnasium.spaces.Tuple": [[6, 1, 1, "", "sample"], [6, 1, 1, "", "seed"]], "gymnasium.spaces.utils": [[8, 4, 1, "", "flatdim"], [8, 4, 1, "", "flatten"], [8, 4, 1, "", "flatten_space"], [8, 4, 1, "", "unflatten"]], "gymnasium.utils.env_checker": [[9, 4, 1, "", "check_env"]], "gymnasium.utils.ezpickle": [[9, 0, 1, "", "EzPickle"]], "gymnasium.utils.performance": [[9, 4, 1, "", "benchmark_init"], [9, 4, 1, "", "benchmark_render"], [9, 4, 1, "", "benchmark_step"]], "gymnasium.utils.play": [[9, 0, 1, "", "PlayPlot"], [9, 0, 1, "", "PlayableGame"], [9, 4, 1, "", "play"]], "gymnasium.utils.play.PlayPlot": [[9, 1, 1, "", "callback"]], "gymnasium.utils.play.PlayableGame": [[9, 1, 1, "", "process_event"]], "gymnasium.utils.save_video": [[9, 4, 1, "", "capped_cubic_video_schedule"], [9, 4, 1, "", "save_video"]], "gymnasium.utils.seeding": [[9, 4, 1, "", "np_random"]], "gymnasium.utils.step_api_compatibility": [[9, 4, 1, "", "convert_to_done_step_api"], [9, 4, 1, "", "convert_to_terminated_truncated_step_api"], [9, 4, 1, "", "step_api_compatibility"]], "gymnasium.vector": [[11, 0, 1, "", "AsyncVectorEnv"], [12, 0, 1, "", "SyncVectorEnv"], [14, 0, 1, "", "VectorActionWrapper"], [10, 0, 1, "", "VectorEnv"], [14, 0, 1, "", "VectorObservationWrapper"], [14, 0, 1, "", "VectorRewardWrapper"], [14, 0, 1, "", "VectorWrapper"]], "gymnasium.vector.AsyncVectorEnv": [[11, 1, 1, "", "call"], [11, 1, 1, "", "close"], [11, 1, 1, "", "get_attr"], [11, 3, 1, "", "np_random"], [11, 3, 1, "", "np_random_seed"], [11, 1, 1, "", "reset"], [11, 1, 1, "", "set_attr"], [11, 1, 1, "", "step"]], "gymnasium.vector.SyncVectorEnv": [[12, 1, 1, "", "call"], [12, 1, 1, "", "close"], [12, 1, 1, "", "get_attr"], [12, 3, 1, "", "np_random"], [12, 3, 1, "", "np_random_seed"], [12, 1, 1, "", "reset"], [12, 1, 1, "", "set_attr"], [12, 1, 1, "", "step"]], "gymnasium.vector.VectorActionWrapper": [[14, 1, 1, "", "actions"]], "gymnasium.vector.VectorEnv": [[10, 2, 1, "", "action_space"], [10, 1, 1, "", "close"], [10, 2, 1, "", "closed"], [10, 2, 1, "", "metadata"], [10, 3, 1, "", "np_random"], [10, 3, 1, "", "np_random_seed"], [10, 2, 1, "", "num_envs"], [10, 2, 1, "", "observation_space"], [10, 1, 1, "", "render"], [10, 2, 1, "", "render_mode"], [10, 1, 1, "", "reset"], [10, 2, 1, "", "single_action_space"], [10, 2, 1, "", "single_observation_space"], [10, 2, 1, "", "spec"], [10, 1, 1, "", "step"], [10, 3, 1, "", "unwrapped"]], "gymnasium.vector.VectorObservationWrapper": [[14, 1, 1, "", "observations"]], "gymnasium.vector.VectorRewardWrapper": [[14, 1, 1, "", "rewards"]], "gymnasium.vector.VectorWrapper": [[14, 1, 1, "", "close"], [14, 1, 1, "", "render"], [14, 1, 1, "", "reset"], [14, 1, 1, "", "step"]], "gymnasium.vector.utils": [[13, 4, 1, "", "CloudpickleWrapper"], [13, 4, 1, "", "batch_space"], [13, 4, 1, "", "clear_mpi_env_vars"], [13, 4, 1, "", "concatenate"], [13, 4, 1, "", "create_empty_array"], [13, 4, 1, "", "create_shared_memory"], [13, 4, 1, "", "iterate"], [13, 4, 1, "", "read_from_shared_memory"], [13, 4, 1, "", "write_to_shared_memory"]], "gymnasium.wrappers": [[18, 0, 1, "", "AddRenderObservation"], [17, 0, 1, "", "ArrayConversion"], [17, 0, 1, "", "AtariPreprocessing"], [17, 0, 1, "", "Autoreset"], [16, 0, 1, "", "ClipAction"], [19, 0, 1, "", "ClipReward"], [18, 0, 1, "", "DelayObservation"], [18, 0, 1, "", "DtypeObservation"], [18, 0, 1, "", "FilterObservation"], [18, 0, 1, "", "FlattenObservation"], [18, 0, 1, "", "FrameStackObservation"], [18, 0, 1, "", "GrayscaleObservation"], [17, 0, 1, "", "HumanRendering"], [17, 0, 1, "", "JaxToNumpy"], [17, 0, 1, "", "JaxToTorch"], [18, 0, 1, "", "MaxAndSkipObservation"], [18, 0, 1, "", "NormalizeObservation"], [19, 0, 1, "", "NormalizeReward"], [17, 0, 1, "", "NumpyToTorch"], [17, 0, 1, "", "OrderEnforcing"], [17, 0, 1, "", "PassiveEnvChecker"], [17, 0, 1, "", "RecordEpisodeStatistics"], [17, 0, 1, "", "RecordVideo"], [17, 0, 1, "", "RenderCollection"], [16, 0, 1, "", "RescaleAction"], [18, 0, 1, "", "RescaleObservation"], [18, 0, 1, "", "ReshapeObservation"], [18, 0, 1, "", "ResizeObservation"], [16, 0, 1, "", "StickyAction"], [18, 0, 1, "", "TimeAwareObservation"], [17, 0, 1, "", "TimeLimit"], [16, 0, 1, "", "TransformAction"], [18, 0, 1, "", "TransformObservation"], [19, 0, 1, "", "TransformReward"]], "gymnasium.wrappers.vector": [[14, 0, 1, "", "ArrayConversion"], [14, 0, 1, "", "ClipAction"], [14, 0, 1, "", "ClipReward"], [14, 0, 1, "", "DictInfoToList"], [14, 0, 1, "", "DtypeObservation"], [14, 0, 1, "", "FilterObservation"], [14, 0, 1, "", "FlattenObservation"], [14, 0, 1, "", "GrayscaleObservation"], [14, 0, 1, "", "JaxToNumpy"], [14, 0, 1, "", "JaxToTorch"], [14, 0, 1, "", "NormalizeObservation"], [14, 0, 1, "", "NormalizeReward"], [14, 0, 1, "", "NumpyToTorch"], [14, 0, 1, "", "RecordEpisodeStatistics"], [14, 0, 1, "", "RescaleAction"], [14, 0, 1, "", "RescaleObservation"], [14, 0, 1, "", "ReshapeObservation"], [14, 0, 1, "", "ResizeObservation"], [14, 0, 1, "", "TransformAction"], [14, 0, 1, "", "TransformObservation"], [14, 0, 1, "", "TransformReward"], [14, 0, 1, "", "VectorizeTransformAction"], [14, 0, 1, "", "VectorizeTransformObservation"], [14, 0, 1, "", "VectorizeTransformReward"]]}, "objnames": {"0": ["py", "class", "Python class"], "1": ["py", "method", "Python method"], "2": ["py", "attribute", "Python attribute"], "3": ["py", "property", "Python property"], "4": ["py", "function", "Python function"], "5": ["py", "module", "Python module"]}, "objtypes": {"0": "py:class", "1": "py:method", "2": "py:attribute", "3": "py:property", "4": "py:function", "5": "py:module"}, "terms": {"": [1, 2, 3, 5, 6, 7, 9, 10, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 126, 127, 128, 129, 130, 131, 133, 134, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 149, 150, 151, 152, 153, 154, 155, 156, 157, 158, 159, 162, 164, 166, 167, 168, 170, 174, 175, 177, 178], "0": [2, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 127, 128, 129, 131, 132, 133, 134, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 150, 151, 152, 153, 154, 158, 159, 162, 164, 166, 167, 168, 174, 175, 177, 178], "00": [2, 10, 18], "000": 164, "00000000e": [10, 18], "00048403": 14, "000635": [10, 14], "00080468": 14, "0008876301247721108": 19, "001": [133, 135, 140, 164, 174, 178], "00105192": 14, "00127": 14, "00133522": 14, "00142543": 14, "0015": 134, "002": [18, 139, 147, 170], "00209899": 14, "00214607": 11, "0025": [133, 134], "00266526": 14, "003": 140, "00372536": 14, "00395268": 14, "005": [144, 145, 178], "00529102": 14, "00545912": 14, "0059888": 18, "00611216": [10, 18], "00614867": 14, "00615723": 14, "00624371": 14, "00708": 6, "00711833": 6, "00715587": 14, "007812": 14, "008": [139, 147], "00848456": 10, "00942293": 10, "00987654": 158, "01": [2, 10, 14, 16, 18, 129, 137, 138, 141, 142, 143, 144, 145, 146, 155, 156, 159, 164, 170, 174, 178], "010162116476634746": 19, "01098382": [10, 14], "01162461": 10, "01234567": 158, "0123456789": 7, "0123456789abcdefghijklmnopqrstuvwxyzabcdefghijklmnopqrstuvwxyz": 7, "01431748": 10, "01456789": 158, "015": 140, "01522993": 10, "01734283": [10, 16], "01823519": [10, 14, 16, 18], "0197368": [10, 18], "02": [10, 18, 145, 155, 156, 164], "0203607": 16, "0219676": 14, "02345678": 158, "02418869": 10, "024251968": 14, "02438": 178, "02480598": [10, 14], "02727336": [10, 18], "02728892": 16, "0273956": [10, 18], "02796401": [10, 14, 16, 18], "02852531": [10, 14], "02858594": [10, 14], "02859527": [10, 16], "029028230434438706": 14, "02909703": 10, "03": [14, 129, 155, 156], "03156282": [10, 14, 16, 18], "03203924": [10, 14], "0333221090036294": 14, "03332211": 14, "03359492141887935": 14, "03392126": 10, "03516225": 10, "03517495": [10, 14], "03525399": 16, "03585979": [10, 18], "03625453": [10, 18], "03647037": 132, "03774345": 10, "03812904": 16, "03822722": 10, "04": [14, 16, 146, 155], "0446179": [10, 14, 16, 18], "04562247": 10, "0469136": [10, 14], "0469184": 10, "04731862": 10, "04740972": 10, "04794393": 16, "04799704": 10, "05": [14, 132, 137, 138, 141, 144, 155, 156, 164, 170], "055928": 14, "05592803": 132, "06": [155, 156], "06296527": 14, "06296527291998574": 14, "0631256": 14, "06312564": 132, "0640786": 14, "06540678": 18, "06670535": 16, "07": [133, 134, 155, 156], "07287608": 131, "07422512": 18, "08": [155, 156], "0808398": 11, "08227695": 18, "0892358": [14, 132], "09": [155, 156], "09417735": 13, "09613613": 18, "0_": [137, 138, 142, 144], "0_2": [144, 145], "0_3": 144, "0a2": 132, "0th": 17, "0x7f04efcb8850": 158, "0x7fbb5efd0490": 15, "1": [2, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 127, 128, 129, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 150, 151, 152, 153, 154, 158, 159, 162, 164, 166, 167, 168, 174, 175, 177, 178], "10": [6, 7, 14, 17, 18, 127, 129, 135, 137, 138, 139, 140, 141, 142, 144, 145, 146, 147, 150, 151, 152, 154, 155, 156, 158, 159, 161, 162, 164, 166, 174, 177, 178], "100": [6, 8, 14, 17, 127, 128, 129, 131, 134, 139, 144, 148, 151, 152, 153, 162, 164, 170], "1000": [9, 17, 128, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 157, 162, 164, 170, 177, 178], "1006": 156, "1009": 156, "100_000": [164, 174], "1013": 156, "10172354684460168": 14, "10172355": 14, "1018": 156, "1019": 156, "1027": 156, "1033": 156, "105": [137, 156], "107": 137, "1075": 156, "1086": 156, "1087": 156, "1094": 156, "1095": 156, "10_000": 162, "10th": 161, "10x": 174, "11": [14, 137, 138, 139, 140, 141, 144, 147, 150, 151, 152, 155, 174, 178], "110": 156, "1105": 156, "1107": 156, "1109": 156, "11185605": 131, "1119": 156, "112": 156, "1120": 156, "11448676": 14, "117": 156, "12": [8, 16, 17, 18, 129, 131, 132, 137, 138, 139, 140, 141, 144, 147, 151, 152, 156, 164, 174, 178], "120": 178, "12224312": [11, 12], "1229": 156, "123": [2, 6, 10, 11, 14, 16, 17, 18, 19, 131, 132, 133, 134, 135, 156, 161, 175], "1230": 156, "124": 156, "1240": 156, "1243": 156, "125": 156, "1250": 156, "1253": 156, "125637": 6, "1260": 156, "12625128": 131, "1264": 156, "1271": 156, "128": 178, "1280": 136, "1283": 156, "1285": 156, "1288": 156, "1289": 156, "1291": 156, "1293": 156, "1294": 156, "1297": 156, "1299": 156, "13": [137, 138, 140, 141, 144, 147, 154, 155, 156], "130": [140, 141, 156], "1304": 156, "1306": 156, "1308": 156, "1310": 156, "1312": 156, "1315": 156, "1319": 156, "132": [151, 152, 156], "1328": 156, "1329": 156, "1333": 156, "1334": 156, "136": 156, "1361": 156, "1378": 156, "138": 156, "1387": 156, "139": 156, "1393": 156, "1396": 156, "14": [137, 138, 140, 141, 144, 147, 155, 156, 174], "141": 156, "1415927": 127, "143": 156, "145": 137, "1455": 17, "146": 156, "14995256": [11, 12], "15": [8, 16, 17, 18, 19, 129, 137, 138, 140, 141, 144, 147, 153, 162, 175, 178], "150": 9, "1500": 155, "1506": 178, "15089367": [10, 16], "1511158": 18, "155": 156, "1598639586606745": 14, "16": [135, 137, 138, 140, 141, 144, 147, 153, 155, 156, 174, 177], "160": 156, "1600": 127, "1613": 154, "164": 156, "16717631": 10, "17": [137, 138, 140, 141, 144, 147, 150, 155], "17032": 156, "171": 156, "1710671": 10, "172": 156, "173": 156, "174": 156, "17752565": 131, "178": 156, "179": 156, "18": [18, 137, 138, 140, 141, 144, 147, 155], "1800": 175, "183": 156, "184": 156, "1851753": 11, "186": 156, "1878752": 12, "18847767": 10, "18879032e": [10, 18], "1887903e": 2, "18933342": 6, "19": [137, 140, 141, 144, 178], "190": 156, "19049619": 6, "1938739": 14, "195": [156, 170], "19559774": 10, "199": 9, "1990": [133, 134], "1995": 131, "1996": 131, "1_": 145, "1b15": 155, "1d": [158, 159, 177], "1e": [14, 18, 19, 139, 140, 141, 146, 147, 177], "1f": 162, "2": [2, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 16, 17, 18, 19, 128, 129, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 150, 151, 152, 153, 154, 158, 159, 162, 164, 166, 167, 168, 174, 175, 177, 178], "20": [129, 137, 140, 141, 144, 154, 156, 174, 175, 178], "200": [9, 17, 129, 131, 132, 133, 135, 153, 154, 156, 162], "2000": [9, 127, 154, 175], "2004": 177, "200th": 17, "2014": 128, "2016": 178, "2017": 155, "20172954": 18, "2018": [16, 17, 131, 155], "2019": 155, "2020": [148, 150, 151, 152], "2021": [136, 148, 155], "2022": [136, 155, 156], "2023": 156, "2024": 156, "2025": 156, "205": 156, "206": 156, "208": 156, "20946532": 14, "2095": 132, "21": [18, 19, 137, 140, 141, 144, 150, 156, 164, 174, 178], "210x180": 17, "215": 156, "216": 156, "21649833": 6, "218": 156, "219": 156, "21944423": 14, "22": [17, 137, 140, 141, 144, 156, 174], "220": 174, "221": 156, "223": 156, "224": 156, "225": 156, "227": 154, "229": 177, "23": [137, 140, 141, 144, 156, 162], "230": 156, "234": 156, "235": 156, "235794": 6, "2359734": 14, "238": 156, "24": [14, 17, 18, 127, 128, 129, 132, 137, 140, 141, 156, 174], "24002443": 10, "2407": 156, "241": 156, "244": 156, "24503504": 14, "2456": 155, "246": 156, "247": 156, "2487226": 10, "249": 156, "25": [2, 8, 10, 17, 19, 137, 139, 140, 141, 147, 154, 156, 162, 170], "250": [156, 162], "250th": 162, "252": 156, "2524": 155, "254": 156, "255": [17, 18, 128, 156, 166], "25533703": 18, "256": 177, "257": 156, "25715804": 10, "258": 156, "259": 156, "25g": 137, "26": [2, 17, 137, 140, 141, 160, 167, 177], "26141977": 10, "264": 156, "264d": 170, "267": 156, "2671": 155, "2678": 155, "268": 156, "2684": 155, "27": [9, 19, 140, 141], "270": 156, "272": 156, "2736044": 135, "274": [131, 156], "274334": 131, "27648": [14, 18, 158], "277": 156, "278": 156, "27800309628058434": 14, "279": 156, "28": [14, 131, 140, 141], "281": 156, "282": 156, "2831855": 129, "284": 156, "29": [17, 140, 141, 155, 162], "2906": 155, "292": 156, "2d": [136, 145, 148, 159, 168], "2f": 162, "2gb": 155, "3": [2, 4, 5, 6, 7, 8, 9, 10, 12, 13, 14, 15, 16, 17, 18, 19, 127, 128, 129, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 150, 151, 152, 153, 154, 158, 159, 160, 162, 164, 166, 174, 175, 177, 178], "30": [2, 9, 17, 140, 141, 154, 156], "300": [127, 154, 159, 166, 175], "3000": 9, "3016": 155, "303": 154, "3034542e": 14, "3036": 155, "3037": 155, "304": 156, "3040": 155, "3041": 155, "3044": 155, "3072": 155, "30759571": 170, "3076": 155, "3080": 155, "3083": 155, "31": [140, 141, 156], "3110827": 10, "3118435e": 14, "3152": 19, "3154": 19, "32": [18, 140, 141, 150, 177, 178], "321": 156, "323": [144, 156], "32351476": 18, "327": [137, 156], "329": 156, "33": [140, 141], "330": 156, "331": 156, "3319138": 10, "332": 156, "33293587": [10, 16], "333": 156, "337": 156, "338": 156, "339": 156, "34": [140, 141], "340": 156, "341": 156, "342": 156, "34641072": 16, "34756234": 16, "348": [140, 141], "35": [140, 141, 156], "350": [140, 141], "355": 156, "36": [6, 140, 141, 151, 152], "37": [140, 141, 156], "373": 156, "38": [140, 141], "39": [140, 141, 156], "3991573": 6, "3d": [136, 137, 140, 141, 148, 159, 174], "3f": 164, "3rd": 136, "3v3": 148, "4": [2, 6, 7, 8, 9, 10, 14, 16, 17, 18, 127, 128, 129, 131, 132, 133, 134, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 150, 151, 152, 153, 154, 156, 158, 159, 162, 164, 166, 168, 174, 177], "40": [140, 141], "400": [18, 154], "403": 156, "404": [154, 156], "405": 156, "407": 156, "41": [140, 141, 156], "4123625": 135, "418": [132, 156, 158], "41887903": [10, 18, 132], "4189": 6, "42": [6, 7, 10, 11, 12, 13, 16, 18, 140, 141, 156, 157, 159, 161, 164, 178], "424": 156, "42683297": 14, "42884544": 14, "429": 156, "43": [140, 141, 164], "433": 156, "435": 156, "4351738": 14, "4354835e": 14, "43887845": 13, "44": [6, 140, 141], "440": 156, "444": 156, "44504836": 14, "44799727": 14, "4488689e": 14, "45": [134, 144, 164], "450": 156, "451": 156, "459": 156, "4624777": 14, "46352962": [14, 133], "46515748": 14, "46543318": 14, "46546045": 14, "46553135": 14, "47": [151, 152], "47037": 6, "47377947": 14, "474": 156, "47599354": 14, "47de": 170, "48": [151, 152, 164], "480": 136, "4808415e": 16, "482": 156, "48468155": 14, "48657528": 14, "487": 156, "49": 164, "491": 156, "495": 156, "497": 156, "498371": 14, "4x12": [151, 152], "4x4": 153, "4\u03c0": 131, "5": [6, 7, 8, 9, 10, 13, 14, 16, 17, 18, 19, 127, 128, 129, 131, 133, 134, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 150, 154, 159, 164, 166, 174, 175, 177, 178], "50": [17, 129, 137, 138, 139, 140, 141, 142, 144, 145, 146, 147, 164, 177], "500": [17, 18, 131, 132, 154, 155, 158, 162, 164, 174, 178], "503": 156, "51": [6, 156], "510": 156, "512": [156, 166], "515": 156, "516": 156, "518": 156, "520": 156, "522": 156, "524": 156, "525": 156, "5281": 156, "529": 156, "533": 156, "5342437e": 14, "535": 156, "536": 156, "538": 156, "54": 6, "540": 156, "5420062": 16, "548": 156, "55": [6, 156], "553": 156, "554": 156, "557": 156, "558": 156, "561": 156, "5635296": 134, "564": 156, "566371": 131, "567": 131, "5676788": 18, "569": 156, "57": 178, "572": 156, "573": 156, "576": 156, "5760367": [11, 12], "58": 156, "580": 156, "581": 156, "583": 156, "5836242": 6, "588": 156, "589": 156, "590": 156, "594091": 6, "5e": [137, 139, 140, 141, 147, 170], "5e3": 177, "5gb": 155, "5x": 156, "5x5": [154, 159], "6": [8, 14, 16, 17, 18, 129, 131, 133, 134, 135, 137, 138, 139, 140, 141, 142, 144, 145, 146, 147, 151, 152, 154, 156, 162, 177], "60": [8, 156], "600": [18, 178], "604": 156, "608": 156, "61": 156, "6102389": 12, "612": 156, "6120394": 18, "616": 156, "6193494": 11, "62": [6, 11, 12], "62259156": 14, "63": [6, 7], "63214064": 6, "634": 156, "6343064e": 14, "6344974": 16, "635": 156, "6382770e": 16, "639": 154, "6397772e": 16, "64": [6, 156], "6608303": 16, "666": 129, "669": 6, "67": 162, "6822636": 6, "683": 156, "68512": 6, "695": 156, "697368": 13, "6fn5ja9uzquzxgkvpwtqjz1eyjcs3hj3": 170, "7": [7, 9, 129, 134, 135, 137, 138, 139, 140, 141, 142, 144, 145, 146, 147, 148, 156, 170, 178], "70": 156, "708": 156, "709": 156, "714599": 11, "7183299": 18, "72": 156, "720": 136, "7257502": 6, "729": 9, "73": 156, "731": 156, "732": 128, "74": 156, "748": 156, "75": [16, 137, 170], "75cm": 137, "76": 162, "7619033": 14, "762": 156, "7695615": 12, "77": 6, "77395606": 13, "774": 156, "78": [137, 140, 141, 156, 162], "7851154": 11, "788": 156, "789": 156, "791": 156, "79221743": 12, "8": [6, 9, 10, 14, 18, 19, 128, 129, 131, 132, 135, 137, 138, 139, 140, 141, 142, 144, 145, 146, 147, 153, 155, 156, 158, 159, 175, 177, 178], "80": [153, 154], "800": [156, 175], "8000": 1, "80000019": [10, 18], "80000019e": [10, 18], "8000002e": 2, "801": 156, "81": [11, 12, 135, 156], "810": 156, "811": 156, "812": 156, "8127025": 156, "8127026": 156, "817": 156, "8174238": [11, 12], "81882": 6, "827": 156, "83": 156, "830": 156, "83506": 6, "838": 156, "84": [6, 17], "8498053": 12, "84x84": 17, "85859793": 13, "867": 156, "886": 156, "889": 156, "88g": 137, "89": [6, 156], "8914354": 18, "89235795": 135, "893": 156, "89345848": 14, "8934584807363618": 14, "8971417e": 14, "898": 156, "8f1d43620bc6bb580df6e80b0dc05c48": 131, "8gb": 155, "8x8": 153, "9": [11, 12, 14, 16, 131, 135, 137, 138, 139, 140, 141, 142, 144, 145, 147, 156, 174, 178], "90": 174, "9053838": 6, "9061728": 14, "90849805": 14, "910": 137, "91101986": 135, "91244936": [11, 12], "915": 156, "91g": 137, "9216": 14, "924": 156, "926": [128, 156], "928024": 6, "9296501": 14, "932": 156, "934": 156, "9375233e": 14, "9380709": 16, "941": 156, "9416149": 14, "9428282": 14, "9429494": 14, "95": [128, 164, 174, 175, 178], "9503881": 14, "950912": 6, "952": 156, "9532328e": 14, "956": 156, "957": 156, "958": 156, "959": 156, "96": [14, 18, 128, 158], "9635296": 14, "96495728": 11, "965": 156, "96562607": 12, "96x96": [128, 158], "97562236": 13, "977": 156, "978": 156, "97854": 6, "979": 156, "9808417e": 16, "982": 156, "98219293": 12, "98270553": 11, "9841162": 131, "9886932": [11, 12], "9898634e": 14, "99": [14, 19, 177, 178], "9944268": 18, "997341": 131, "999": [134, 178], "99902063": 12, "9999": 129, "9\u03c0": 131, "A": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 14, 16, 17, 18, 19, 20, 127, 128, 131, 132, 134, 136, 137, 138, 139, 140, 141, 142, 144, 145, 146, 147, 148, 150, 151, 152, 153, 155, 156, 158, 159, 160, 166, 167, 168, 174, 177, 178], "AND": 161, "And": [166, 170], "As": [2, 5, 10, 15, 17, 131, 132, 136, 149, 151, 152, 155, 156, 158, 159, 163, 168, 175, 177, 178], "At": [14, 17, 158], "Be": 156, "But": [137, 164], "By": [2, 4, 10, 17, 18, 131, 137, 138, 139, 140, 141, 146, 147, 148], "For": [2, 3, 5, 7, 8, 9, 10, 17, 18, 19, 128, 129, 136, 151, 152, 153, 154, 155, 156, 158, 159, 160, 161, 162, 163, 164, 166, 168, 170, 174, 178], "If": [1, 2, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 127, 128, 129, 132, 134, 137, 139, 140, 147, 148, 150, 151, 152, 153, 154, 155, 156, 157, 158, 160, 161, 166, 168, 170, 172, 174, 175, 178], "In": [2, 7, 9, 13, 15, 16, 19, 128, 129, 130, 131, 132, 137, 138, 139, 140, 141, 145, 146, 147, 154, 155, 156, 158, 159, 162, 163, 166, 167, 168, 170, 174, 175, 177, 178], "It": [2, 4, 6, 7, 9, 10, 11, 12, 16, 17, 127, 136, 137, 140, 141, 144, 145, 146, 148, 155, 156, 158, 159, 162, 163, 164, 166, 174, 177], "Its": 148, "No": [16, 17, 18, 150, 155, 159, 161, 177], "Not": [17, 155, 159], "OR": 161, "On": [131, 132, 133, 134, 135, 155, 156, 159, 175], "One": [7, 137, 140, 141, 156, 158, 159], "Or": [154, 161], "Such": [15, 168], "That": [3, 132, 158, 164], "The": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 126, 127, 128, 129, 130, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 150, 151, 152, 153, 154, 155, 156, 157, 158, 159, 160, 162, 165, 166, 167, 169, 170, 171, 172, 173, 174, 176, 177, 178], "Then": [1, 15, 159, 161, 166, 168], "There": [7, 15, 127, 129, 130, 133, 134, 136, 140, 142, 148, 151, 152, 154, 155, 156, 166], "These": [9, 126, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 155, 156, 161, 174, 177], "To": [1, 2, 4, 9, 10, 13, 15, 17, 18, 127, 128, 129, 131, 132, 144, 154, 155, 156, 158, 160, 166, 168, 170, 174, 175, 177, 178], "Will": [9, 17, 20, 156], "With": [6, 14, 17, 148, 151, 152, 156, 164, 174, 175, 178], "_": [9, 10, 11, 12, 13, 14, 16, 17, 18, 19, 128, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 156, 157, 161, 164, 168, 170, 175, 178], "_2": [137, 138, 139, 140, 141, 144, 145, 146, 147], "__all__": 156, "__class__": 178, "__del__": 156, "__eq__": 155, "__future__": [174, 177, 178], "__get_attr__": 156, "__getattr__": 156, "__getitem__": 155, "__init__": [2, 9, 14, 15, 16, 18, 156, 164, 166, 168, 174, 175, 177, 178], "__len__": 155, "__main__": 178, "__name__": 178, "__setitem__": 155, "_action": 141, "_action_to_direct": [159, 166], "_agent_loc": [159, 166], "_async_work": 11, "_bigint_from_byt": 155, "_build": 1, "_control": 141, "_cost": [140, 141], "_dtypedict": 5, "_episod": [14, 17], "_final_info": 14, "_final_observ": 14, "_get_info": [159, 166], "_get_ob": [159, 166], "_int_list_from_bigint": 155, "_k": 14, "_modul": 18, "_nois": [137, 138, 139, 140, 141, 142, 143, 146, 147], "_np_random": [2, 5, 10, 155], "_np_random_se": [2, 10], "_rang": [140, 141], "_render_fram": 166, "_replac": 175, "_reward_ctrl": 14, "_reward_run": 14, "_scale": [137, 138, 139, 140, 141, 142, 143, 146, 147], "_script": 1, "_static": 1, "_step_mujoco_simul": 156, "_supportsdtyp": 5, "_target_loc": [159, 166], "_timelimit": 155, "_update_running_mean": [14, 19], "_worker": 11, "_x_posit": 14, "_x_veloc": 14, "a2c": [156, 171, 176], "a3c": 178, "a_": [167, 178], "a_0": 6, "a_i": 6, "a_max": 178, "a_min": 178, "a_n": 6, "a_t": 167, "aaronwalsman": 156, "ab": [128, 156, 178], "abbeel": [137, 178], "abdomen": [140, 141], "abdomen_i": [140, 141], "abdomen_x": [140, 141], "abdomen_z": [140, 141], "abil": [156, 158, 163], "abl": [156, 167], "abouelsaadat": 156, "about": [2, 3, 9, 127, 128, 129, 131, 132, 133, 134, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 150, 151, 152, 153, 154, 156, 158, 161, 162, 163, 166, 167, 174, 177], "abov": [2, 6, 7, 9, 131, 132, 135, 136, 156, 158, 160, 162, 177, 178], "absolut": [141, 143, 147, 170], "abstract": [156, 166], "ac": [150, 164, 174], "academ": 163, "academia": 156, "acceler": [128, 133, 134, 135, 148, 155, 156, 178], "accent_r": 174, "accept": [2, 5, 7, 9, 17, 155, 156, 166, 170], "access": [14, 15, 17, 148, 155, 156, 158, 161, 162, 168], "accid": 155, "accident": [155, 156], "accord": [4, 5, 6, 7, 129, 170, 178], "accordingli": 166, "account": [148, 155, 156, 175], "accur": [136, 156, 164], "accuraci": 136, "achiev": [2, 131, 150, 155, 158, 163, 170, 178], "acquir": 136, "acrobot": [130, 155], "acrobotenv": 131, "acronym": 177, "across": [13, 156], "act": [14, 156, 158, 163, 164, 168, 174], "action": [2, 3, 4, 5, 6, 7, 9, 10, 11, 12, 15, 17, 20, 130, 136, 148, 149, 155, 156, 157, 161, 162, 166, 168, 170, 175, 177, 178], "action_log_prob": 178, "action_logit": 178, "action_logits_vec": 178, "action_mask": 154, "action_mean": 177, "action_pd": 178, "action_s": 175, "action_shap": 178, "action_spac": [2, 5, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 154, 156, 157, 158, 159, 161, 162, 164, 166, 168, 170, 174, 175, 177], "action_space_dim": 177, "action_stddev": 177, "action_valu": 174, "actionwrapp": [14, 15, 16], "actor": 177, "actor_lay": 178, "actor_loss": 178, "actor_losses_moving_averag": 178, "actor_lr": 178, "actor_optim": 178, "actor_weight": 178, "actor_weights_path": 178, "acttyp": [2, 3, 9, 10, 11, 12, 14, 15, 16, 17, 18, 19, 156], "actual": [137, 154, 156, 158, 159, 162, 164, 166, 175, 178], "actuat": [131, 132, 140, 141, 156, 170], "acycl": 148, "ad": [14, 16, 17, 18, 19, 129, 132, 134, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 154, 155, 156, 158, 161, 166], "adamw": 177, "adapt": [132, 142, 143, 148, 151, 152, 162], "add": [1, 4, 5, 9, 11, 16, 17, 18, 19, 20, 128, 136, 137, 140, 141, 151, 152, 154, 155, 156, 158, 162, 164, 166, 168, 174, 178], "add_mark": 156, "add_subplot": 174, "addit": [2, 5, 129, 130, 148, 150, 154, 155, 156, 158, 159, 162, 164, 166, 170, 174, 177, 178], "addition": [148, 155, 156, 160], "additional_wrapp": [4, 156], "addrenderobserv": [18, 20, 156], "address": 156, "addwhitenois": 156, "adilzouitin": 155, "adjac": 6, "adjust": [148, 170], "advanc": [11, 131, 148, 156, 162], "advantag": [137, 156, 166], "advis": 14, "affect": [6, 156, 159], "affin": [14, 16, 18, 20, 129], "after": [2, 3, 5, 9, 10, 17, 129, 137, 138, 139, 140, 141, 144, 145, 146, 147, 150, 154, 155, 156, 158, 161, 162, 164, 166, 167, 174, 177, 178], "again": [2, 129, 154, 166], "against": [148, 155], "agent": [2, 4, 5, 14, 17, 20, 127, 128, 129, 133, 137, 138, 139, 140, 141, 142, 143, 145, 146, 147, 148, 155, 156, 159, 161, 163, 166, 167, 168, 175], "agent_i": 159, "agent_posit": 168, "agent_x": 159, "agnost": [137, 138, 139, 140, 141, 146, 147], "ago": 156, "ahead": 155, "ahmedo42": 155, "ai": 148, "aim": [136, 139, 146, 147, 155, 156, 165, 169, 171, 173, 176, 177], "air": [144, 148, 156], "al": [4, 16, 17, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 155, 156, 161, 174], "ale_pi": [17, 156, 161], "alexdluken": 156, "algorithm": [2, 5, 10, 148, 149, 154, 155, 156, 158, 159, 161, 162, 164, 167, 170, 172, 174, 175, 177, 178], "alias": 148, "align": [154, 156, 161], "aliv": [140, 147], "alive_bonu": 142, "all": [2, 4, 5, 6, 7, 10, 11, 12, 13, 14, 15, 16, 17, 18, 126, 128, 129, 130, 131, 132, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 150, 151, 152, 153, 155, 156, 158, 159, 161, 168, 170, 171, 172, 174, 175, 177, 178], "all_act": 175, "all_stat": 175, "alloc": 159, "allow": [3, 4, 5, 6, 9, 11, 12, 14, 15, 17, 18, 19, 20, 131, 132, 133, 134, 135, 140, 141, 142, 143, 147, 148, 155, 156, 158, 159, 160, 161, 166, 168, 177, 178], "almost": 155, "along": [2, 9, 10, 15, 18, 128, 132, 133, 134, 142, 143, 146, 151, 152, 155, 156, 158, 160], "alongsid": 158, "alpha": 162, "alphabet": 7, "alphanumer": 7, "alreadi": [2, 10, 15, 156, 158, 161], "alreadypendingcallerror": 11, "also": [2, 7, 9, 10, 11, 12, 17, 18, 127, 128, 129, 130, 136, 137, 143, 148, 155, 156, 158, 159, 161, 166, 167, 168, 170, 174, 175, 177, 178], "alter": [2, 15, 156, 158, 166], "altern": [1, 148, 156, 159], "although": [7, 137, 170], "altogeth": 170, "alwai": [7, 8, 17, 129, 133, 134, 137, 140, 141, 142, 145, 146, 150, 151, 152, 153, 156, 158, 164, 166], "amacati": 156, "ambigu": 161, "among": [16, 130, 136], "amount": [9, 127, 132, 142, 143, 177], "amp": 156, "amtamasi": 155, "an": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 129, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 150, 151, 152, 153, 154, 155, 156, 157, 158, 159, 160, 161, 162, 163, 166, 167, 168, 170, 172, 175, 178], "analog": 2, "analogi": 144, "analysi": [148, 162], "analyt": 142, "analyz": 162, "anderson": [132, 142, 143], "andrea": [156, 170, 175], "andrew": [133, 134, 156, 175], "andrewtanj": 155, "anerrupt": 156, "angl": [127, 129, 131, 132, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 155, 158, 159], "angle_1": 137, "angle_2": 137, "angle_3": 137, "angle_4": 137, "angular": [127, 129, 131, 132, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147], "ani": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 17, 18, 20, 129, 132, 137, 139, 140, 142, 143, 146, 147, 148, 153, 155, 156, 158, 159, 166, 167, 170, 174, 175, 177], "anim": [9, 136], "ankle_1": 137, "ankle_2": 137, "ankle_3": 137, "ankle_4": 137, "annot": [155, 156, 174, 175, 177, 178], "annot_kw": 175, "annoy": 156, "anoth": [14, 15, 17, 137, 140, 141, 143, 147, 154, 155, 164, 167, 174, 177], "ansi": [2, 155, 156, 166], "ansi_list": 2, "answer": [148, 164, 166], "ant": [136, 155, 156, 170], "anymor": [14, 18, 19, 155, 156], "anyth": [148, 170, 175], "anytrad": 148, "anywher": [156, 159], "apach": 148, "apart": 166, "api": [2, 3, 14, 17, 20, 148, 155, 156, 157, 158, 165, 166, 167, 169, 170, 171, 178], "apicompat": 156, "appear": [133, 134, 158], "append": [14, 19, 156, 164, 174, 175, 177, 178], "appli": [2, 4, 8, 9, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 127, 129, 130, 131, 132, 133, 134, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 150, 155, 156, 161, 166, 168, 174, 177], "applic": [5, 7, 146, 148, 158, 159, 171, 173, 176], "apply_along_axi": 174, "apply_api_compat": [4, 155, 156, 160], "apply_env_compat": 156, "appreci": 155, "approach": [142, 155, 156, 161, 166, 174, 177], "appropri": [156, 166, 170, 177], "approxim": [14, 19, 148, 164], "ar": [2, 4, 5, 6, 7, 8, 9, 10, 11, 13, 14, 15, 16, 17, 18, 19, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 126, 127, 128, 129, 130, 131, 132, 133, 134, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 149, 150, 151, 152, 153, 154, 155, 156, 158, 159, 160, 161, 163, 164, 166, 167, 168, 170, 172, 174, 177, 178], "araffin": 155, "arang": [174, 175, 178], "arbitrari": [2, 4, 7, 9, 148, 178], "arbitrarili": 156, "arcad": [17, 148], "archiv": 155, "archiveprefix": 156, "area": 136, "aren": 155, "arg": [9, 11, 12, 159, 164, 174, 177, 178], "argmax": [154, 164, 174, 175], "argument": [4, 5, 6, 7, 8, 9, 10, 11, 12, 14, 16, 126, 130, 149, 155, 156, 158, 160, 166, 170, 174], "ariel": 156, "arjun": [155, 156], "arm": [136, 140, 141, 144, 145, 148], "around": [3, 14, 126, 148, 155, 164], "arr": [164, 174], "arrai": [2, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 16, 17, 18, 20, 129, 131, 132, 133, 134, 135, 155, 156, 158, 159, 161, 164, 166, 168, 174, 177, 178], "arrang": 4, "array_equ": [159, 166], "arrayconvers": [14, 17, 20, 156], "arraytyp": [10, 11, 12, 14], "arrow": [7, 175], "art": 164, "artemmiyi": 156, "articl": 175, "articul": [146, 148], "artifici": 154, "arxiv": [156, 178], "as_cmap": 175, "ascii": [155, 159], "ask": 159, "aspect": [155, 158, 167], "assert": [156, 166], "assess": 2, "asset": [153, 170], "assign": [2, 132, 133, 134, 144, 145, 148, 156, 174, 175], "assist": 148, "associ": [155, 156], "assum": [7, 14, 18, 136, 156, 161, 166], "assumpt": 161, "async": [4, 11, 156], "asynchron": [5, 10, 11, 12, 156], "asyncvectorenv": [10, 156, 163, 178], "atari": [9, 17, 20, 155, 156, 158, 174], "atari_wrapp": 18, "ataripreprocess": [17, 20, 156], "attach": [129, 132, 135, 137, 142, 143, 147], "attempt": [8, 129, 136, 154, 178], "attitud": 148, "attr": 6, "attribut": [4, 6, 11, 12, 17, 18, 19, 156, 158, 166, 168], "attributeerror": 156, "audio": 156, "augment": [18, 20, 158], "author": [133, 134, 155, 156, 170, 174, 175, 177, 178], "auto": [21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 156], "autobuild": 1, "autom": [148, 155], "automat": [1, 2, 4, 10, 11, 12, 14, 17, 18, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 155, 156, 160, 161, 164, 166, 178], "automata": [148, 156], "autoreset": [4, 10, 11, 12, 17, 20, 156], "autoreset_mod": [10, 11, 12, 156], "autoresetmod": [10, 11, 12, 156], "autoresetwrapp": [17, 155, 156], "autorom": [155, 156], "aux_1": 137, "aux_2": 137, "aux_3": 137, "aux_4": 137, "auxiliari": [2, 159, 166], "avail": [4, 10, 129, 148, 150, 151, 152, 155, 156, 159, 161, 162, 166, 170, 172], "averag": [9, 14, 19, 20, 162, 164, 167, 174, 175, 177], "average_reward": 164, "avg_length": 162, "avg_rec": 162, "avg_reward": [162, 177], "aviat": 148, "avoid": [10, 13, 15, 151, 152, 154, 158, 159, 170], "awai": [137, 138, 139, 140, 144, 145, 146, 147, 154, 168, 175], "awak": 129, "awar": [148, 156], "award": 132, "ax": [5, 7, 164, 166, 174, 175, 178], "ax1": 174, "ax2": 174, "axb2035": 156, "axi": [17, 18, 133, 134, 137, 140, 141, 146, 174, 175], "ayesh": 156, "b": [1, 7, 144, 145, 154, 155], "b14c": 170, "b2dtut": 128, "b5": 7, "back": [11, 14, 15, 17, 18, 20, 126, 136, 137, 138, 156, 170], "back_leg": 137, "backend": [155, 156, 166], "background": 128, "backlog": 156, "backport": 155, "backward": [138, 155, 156, 160, 177, 178], "bad": [13, 158, 159, 164], "badia": 178, "balanc": [132, 142, 143, 158, 159, 164, 177, 178], "bali": 156, "balisujohn": [155, 156], "bandit": 148, "bar": [9, 164, 178], "bare": 15, "barto": [2, 131, 132, 142, 143, 150, 151, 152, 155, 174, 175], "base": [2, 4, 5, 9, 10, 13, 14, 15, 17, 18, 19, 20, 126, 131, 133, 134, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 154, 155, 156, 158, 159, 164, 166, 168, 170, 174, 177, 178], "base_env": 15, "baselin": 148, "baselines3": [18, 172], "basemujocoenv": 156, "bash": 155, "basic": [156, 159, 161, 162, 164, 170, 172], "basicconfig": 162, "basilisk": 148, "batch": [5, 10, 11, 12, 13, 14, 155, 178], "batch_spac": [5, 13, 156], "bbox_to_anchor": 174, "beanpow": 156, "beat": [148, 150], "beatabl": 174, "becam": 155, "becaus": [136, 161, 164, 166, 168, 170, 174, 178], "becom": [126, 155, 156, 164, 167, 178], "been": [2, 9, 10, 15, 129, 137, 140, 141, 148, 155, 156, 158, 159, 161, 166, 167, 175, 178], "befor": [2, 4, 9, 10, 14, 15, 16, 17, 18, 19, 20, 128, 137, 138, 139, 140, 144, 145, 146, 147, 155, 156, 158, 161, 164, 166, 168, 170, 177, 178], "began": 156, "begin": [14, 17, 155, 158, 159, 161, 166, 174, 178], "beginn": [156, 159], "behav": [155, 162], "behavior": [14, 15, 135, 136, 137, 138, 139, 140, 141, 146, 147, 148, 155, 156, 158, 159, 161, 162, 164, 166, 168, 170], "behaviour": [129, 136, 156], "behind": [2, 137, 140, 156, 161], "being": [3, 4, 6, 7, 8, 17, 129, 133, 134, 135, 137, 140, 141, 144, 145, 155, 156, 158, 159, 164, 170, 174, 175], "believ": 156, "bellman": 164, "belong": 6, "below": [7, 10, 20, 135, 147, 156, 158, 167, 174, 178], "benchmark": [126, 148], "benchmark_init": 9, "benchmark_rend": 9, "benchmark_step": 9, "benefit": [17, 156], "bennet": 148, "besid": 136, "best": [164, 174, 175, 178], "better": [127, 155, 156, 159, 161, 164, 178], "between": [3, 6, 7, 14, 17, 18, 19, 20, 129, 131, 132, 135, 136, 137, 138, 139, 140, 141, 142, 143, 145, 146, 147, 148, 155, 156, 158, 159, 161, 164, 166, 167, 174, 175, 177, 178], "beyond": 156, "bf1797a3": 170, "bfoot": 138, "bia": [137, 138, 139, 140, 141, 146, 147, 178], "bias": [162, 178], "big": [164, 166, 175], "bigger": 175, "biggest": [161, 175], "bike": [158, 164], "binari": [5, 7, 148, 158, 166], "bind": [126, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 155], "biomechan": 136, "bipe": 136, "biped": [126, 140, 141, 147, 155, 170], "bipedal_walk": 127, "bipedalwalk": [127, 155], "biplan": 148, "bird": 148, "bit": 155, "bitcraz": 148, "bkrl": 155, "black": [131, 155, 156, 174, 175], "blackjack": [149, 155, 156, 171, 176], "blackjack_q_learn": 174, "blackjackag": [164, 174], "blit": 166, "blob": [151, 152, 155, 170], "block": 156, "blog": [155, 156, 161], "blue": [131, 154, 166, 175], "blueski": 148, "board": 148, "board_gam": 155, "bodi": [129, 136, 137, 138, 139, 140, 141, 142, 144, 146, 147, 170], "boilerpl": [15, 158, 166, 168], "bonu": [147, 178], "book": [131, 150, 151, 152, 155, 174], "book_or_nip": 131, "bool": [2, 4, 5, 6, 7, 9, 10, 11, 12, 14, 15, 17, 18, 132, 136, 137, 138, 139, 140, 141, 146, 147, 164, 166, 174, 175, 177], "bool8": 156, "bool_": 156, "boolean": [2, 5, 9, 14, 17, 129, 156, 174, 177], "booster": 129, "bootstrap": [2, 161, 167, 178], "bot": 148, "both": [7, 10, 11, 12, 18, 127, 130, 131, 147, 148, 150, 151, 152, 153, 154, 155, 156, 158, 159, 160, 161, 162, 163, 166, 167, 175, 177], "bother": 166, "bottom": [128, 133, 134, 139, 151, 152, 156, 159, 175], "bound": [2, 7, 14, 16, 17, 18, 19, 20, 129, 131, 132, 133, 134, 135, 155, 156, 158, 159, 167], "boundari": 8, "bounded": 5, "box": [2, 5, 6, 7, 8, 10, 11, 13, 14, 15, 16, 17, 18, 20, 127, 128, 129, 131, 132, 133, 134, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 155, 156, 158, 159, 166, 168], "box2d": [127, 128, 129, 155, 156, 158], "brake": 128, "brax": [148, 156], "break": [155, 156, 161, 164, 175], "bridg": 148, "bring": 156, "britojr": 156, "brittl": 177, "broken": [17, 155], "brown": 156, "browser": 1, "bshin": 138, "bsk": 148, "bsuit": 148, "bthigh": 138, "btjanaka": 156, "buffalo": 148, "buffer": [14, 17, 128], "buffer_length": [14, 17, 162, 164, 174, 178], "bug": [17, 129, 136, 137, 139, 140, 142, 143, 144, 145, 147, 153, 155, 156, 161, 164], "build": [5, 126, 137, 138, 139, 140, 141, 142, 143, 146, 147, 148, 156, 158, 162, 166, 168], "built": [13, 148, 155, 156, 159, 163], "bullet": 148, "bump": 155, "bunch": 175, "burden": 177, "bushi": 9, "busi": 158, "bust": [150, 164, 174], "button": [5, 7, 9, 158], "c": [9, 129, 131, 156, 166, 177], "cab": 154, "calcul": [14, 18, 19, 135, 137, 142, 151, 152, 153, 154, 159, 162, 170, 178], "call": [2, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 137, 144, 145, 150, 153, 155, 156, 158, 159, 160, 161, 164, 166, 170, 174, 178], "call_async": 156, "call_wait": 156, "callabl": [3, 4, 9, 11, 12, 13, 14, 16, 17, 18, 19, 156], "callback": [9, 155], "cambridg": [133, 134], "camera": [136, 137, 138, 139, 140, 146, 147], "camera_id": 136, "camera_nam": 136, "campbel": 128, "can": [1, 2, 4, 5, 6, 7, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 126, 128, 129, 130, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 150, 151, 152, 153, 154, 155, 156, 157, 158, 159, 160, 161, 162, 163, 164, 166, 168, 170, 175, 177, 178], "cannot": [4, 8, 13, 17, 148, 151, 152, 155, 156, 166, 167, 172], "canva": 166, "capabl": [155, 157, 162], "capped_cubic_video_schedul": [9, 17], "captur": [9, 17], "car": [126, 130, 148, 155, 158], "car_rac": [128, 155, 158], "card": [150, 164, 174], "cardin": 159, "care": [5, 148, 164], "carl": 148, "carlo": [164, 174, 177, 178], "carloslui": 155, "carrac": [9, 14, 18, 128, 155, 156, 158], "cart": [130, 142, 143, 158, 177], "cart_posit": 158, "cart_veloc": 158, "cartesian": [6, 7, 135], "cartpol": [2, 9, 10, 14, 16, 17, 18, 19, 130, 132, 136, 142, 143, 148, 155, 156, 158, 160, 161, 162, 164, 172, 177], "cartpoleenv": [17, 132, 156], "cartpolejax": 17, "cartpolevectorenv": [132, 156], "casadi": 148, "case": [2, 3, 5, 6, 7, 13, 14, 16, 128, 137, 138, 139, 140, 141, 146, 147, 154, 156, 158, 159, 161, 166, 167, 168, 170, 177, 178], "casino": [164, 174], "cast": 18, "cat": 138, "catch": [156, 159, 162], "categor": [7, 178], "categori": 1, "caught": 155, "caus": [140, 147, 154, 155, 156, 163, 164], "cbar": 174, "cc": 131, "cclauss": 155, "ccmdp": 148, "cd": 1, "cell": [148, 151, 152, 159, 166], "cellular": [148, 156], "center": [14, 18, 20, 128, 129, 132, 135, 137, 140, 141], "centr": [137, 140, 141], "central": 156, "centric": 177, "certain": [2, 143, 145, 155, 156, 174, 178], "cfrc_ext": [137, 140, 141], "chain": [15, 131, 146, 158], "challeng": [148, 164, 174], "chanc": [11, 148, 154], "chandrasekar": 177, "chang": [1, 2, 3, 9, 11, 12, 13, 14, 15, 16, 17, 18, 19, 128, 129, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 143, 146, 147, 148, 154, 155, 156, 158, 159, 160, 163, 166, 168, 170, 174, 177], "changelog": [4, 155, 156], "channel": [14, 17, 18], "charact": [7, 9], "character": 148, "charg": [6, 148], "charlist": 7, "charraut": 156, "charset": 7, "cheat": 164, "check": [1, 2, 5, 7, 15, 17, 20, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 154, 155, 156, 158, 161, 164, 166, 168, 170, 174, 175], "check_env": [9, 156, 159, 161], "check_environments_match": 156, "checker": [4, 20, 155, 156], "cheetah": 136, "chess": 158, "child": 13, "children": 11, "choic": [158, 159, 175, 177, 178], "choos": [158, 164, 166, 170, 175], "choose_act": 175, "chosen": [2, 7, 151, 152, 175, 178], "chri": 128, "christofkaufmann": 156, "chrisyeh96": 156, "chunk": 17, "ci": [9, 155, 156], "cinert": [140, 141], "circl": 166, "citat": 156, "cite": 156, "civil": 148, "clamp": [140, 141], "clarifi": [155, 156], "clariti": 159, "class": [2, 3, 4, 5, 6, 7, 9, 10, 11, 12, 14, 15, 17, 18, 19, 136, 148, 155, 156, 158, 159, 163, 164, 166, 168, 170, 174, 175, 177, 178], "classic": [129, 131, 132, 133, 134, 135, 139, 143, 146, 147, 148, 155, 156, 158, 167], "classic_control": [17, 155], "classif": 148, "classmethod": 15, "clean": [2, 148], "cleaner": [154, 161], "cleanup": 155, "clear": [13, 17, 156, 158, 159, 161, 162, 164], "clear_mpi_env_var": 13, "clearer": [2, 155, 162], "clearli": 5, "clementperroud": 156, "cliff": [149, 156], "cliff_walk": [151, 152], "cliffwalk": [151, 152, 155, 156], "cliffwalkingslipperi": 152, "climb": 130, "clip": [14, 16, 19, 20, 133, 134, 137, 156, 158, 159, 166, 168, 178], "clip_reward": 166, "clipact": [14, 16, 20, 158], "clipreward": [10, 14, 19, 20, 156, 168], "clobber": 155, "clock": [162, 166], "clockwis": 135, "clone": [148, 170], "close": [2, 3, 7, 9, 10, 11, 12, 14, 15, 17, 19, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 136, 137, 139, 140, 145, 147, 155, 156, 157, 158, 161, 162, 168, 170, 174, 175, 178], "close_extra": [10, 11, 12], "closechoic": 156, "closer": [129, 150, 156, 164], "closest": 127, "cloudpickl": 13, "cloudpicklewrapp": 13, "cluster": 148, "cmap": [174, 175], "cnt": 156, "co": [131, 133, 134, 135, 142, 145, 148], "coars": 131, "code": [2, 3, 5, 6, 9, 11, 14, 15, 17, 18, 19, 131, 148, 155, 156, 162, 163, 166, 168, 170, 171, 174, 175, 177, 178], "codebas": [156, 161, 166], "coeffici": [146, 178], "coin": 7, "coincid": 166, "col": [151, 152, 153], "cola": 156, "colder": 155, "collabor": 162, "collect": [2, 10, 11, 12, 17, 20, 148, 156, 157, 162, 164, 170, 174, 178], "collector": 156, "collid": 129, "collis": [133, 134, 148, 155], "color": [2, 6, 154], "color_palett": 175, "colour": [128, 155], "column": [4, 164, 175, 177], "com": [19, 140, 141, 151, 152, 153, 155, 166, 170, 172, 175, 177], "combin": [2, 5, 9, 15, 145, 158, 159, 178], "come": [129, 137, 138, 139, 140, 146, 147, 156], "comet": 156, "command": [136, 166], "comment": [136, 155, 156, 178], "commit": [156, 166], "common": [7, 15, 18, 20, 156, 161, 162, 167, 168, 171, 173, 176, 177], "commonli": [20, 155], "commonroad": 148, "commun": [11, 155, 161, 162], "compar": [139, 140, 146, 147, 148, 161, 162, 174, 175, 178], "comparison": 162, "compartment": 156, "compat": [14, 17, 18, 20, 144, 148, 155, 156, 157, 166, 167, 168, 170, 174, 175, 177, 178], "compet": 162, "compil": [148, 155, 163], "compilergym": 148, "complement": 2, "complet": [1, 4, 11, 17, 128, 129, 156, 158, 159, 162, 164, 167, 168, 174], "complex": [5, 6, 136, 140, 141, 142, 143, 148, 156, 158, 161, 162, 163, 177, 178], "compli": 155, "complianc": 155, "compliant": [155, 160], "complic": [7, 15, 161, 168], "compon": [18, 158, 159, 161, 166], "compos": [9, 137, 138, 139, 140, 141, 143, 146, 147], "composit": 7, "compound": 8, "comprehens": [148, 155], "compris": 7, "comput": [2, 3, 9, 14, 18, 19, 20, 136, 137, 155, 156, 159, 162, 164, 166, 174, 177, 178], "computation": [148, 163], "compute_metr": 9, "concat": 175, "concaten": [5, 8, 11, 12, 13, 136, 156], "conceptu": [7, 161, 164], "concern": 177, "conda": [156, 166], "condit": [2, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 167, 170, 174, 177], "conduct": 156, "confid": 162, "config": 4, "configur": [126, 130, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 149, 159, 161, 162, 166, 174, 178], "confirm": [131, 155], "conflict": 9, "congratul": [159, 164], "conjunct": [9, 13], "connect": [2, 6, 11, 131, 137, 138, 139, 140, 141, 145, 146, 147, 148], "connectionist": 177, "consecut": 129, "consequ": [155, 158, 164], "consid": [4, 128, 129, 130, 136, 137, 139, 140, 143, 147, 166, 168], "consist": [3, 7, 127, 129, 131, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 150, 155, 156, 158, 159, 161, 162, 163, 164, 166, 168, 170, 174, 177], "consol": [4, 162], "consolid": 155, "constant": [3, 129, 134, 137, 140, 141, 142, 164], "constantli": 145, "constitu": 6, "constrain": 148, "constraint": [140, 141, 142, 148, 159, 161], "construct": [7, 9, 131, 137, 138, 139, 140, 141, 146, 147, 148], "constructor": [4, 9, 15, 155, 156, 158, 166], "consult": 170, "consumpt": 2, "contact": [127, 129, 136, 137, 140, 141, 142, 155], "contact_cost": [137, 140], "contact_cost_rang": 140, "contact_cost_weight": [137, 140, 170], "contact_force_rang": 137, "contain": [1, 2, 5, 8, 10, 13, 17, 18, 127, 128, 129, 131, 132, 133, 134, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 150, 151, 152, 153, 154, 155, 156, 158, 159, 166, 170, 172, 174, 177, 178], "content": 162, "context": [4, 11, 13, 148, 177], "contextu": 148, "continu": [2, 5, 9, 14, 18, 19, 128, 129, 130, 133, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 155, 158, 159, 161, 167, 174, 177, 178], "continuous_mountaincarenv": 134, "contribut": [126, 148, 156, 172], "contributor": 156, "control": [2, 5, 7, 126, 128, 131, 132, 133, 134, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 155, 156, 158, 159, 164, 168, 170, 175, 178], "conveni": [6, 15, 158, 159, 166], "convent": [1, 2], "converg": [164, 174, 175], "convers": [3, 148, 156, 160], "convert": [1, 5, 6, 14, 17, 18, 20, 129, 148, 155, 156, 159, 160, 161, 174, 175], "convert_to_done_step_api": 9, "convert_to_terminated_truncated_step_api": [9, 160], "convolution_mod": 164, "convolv": [156, 164, 174, 178], "cool": 156, "coordin": [7, 14, 127, 129, 135, 137, 138, 139, 140, 141, 144, 145, 146, 147, 148, 159], "coordinatesof": 142, "copi": [10, 11, 12, 13, 159, 166], "copier": 166, "core": [155, 156, 158, 159, 164], "correct": [4, 9, 10, 16, 129, 148, 154, 155, 156, 158, 161, 164, 166, 167, 177], "correctli": [2, 9, 14, 18, 19, 155, 156, 166, 167], "correspond": [1, 2, 4, 7, 11, 12, 15, 18, 129, 131, 132, 133, 134, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 150, 154, 166, 175, 177, 178], "correspondingli": 128, "cosin": [131, 142, 145], "cost": [127, 156], "could": [2, 9, 14, 137, 138, 139, 140, 141, 143, 146, 147, 156, 158, 159, 161, 164, 166, 167, 168, 170, 174, 175, 177, 178], "couldn": 161, "coulom": 146, "count": [7, 127, 129, 150, 164, 174], "counter": [135, 156], "coupl": 178, "cours": [148, 175], "cover": [5, 12, 174], "coverag": 148, "cpu": [129, 136, 163, 178], "craft": 129, "craftium": 148, "crash": [129, 158], "crazyfli": 148, "creat": [4, 5, 7, 9, 10, 11, 12, 13, 14, 15, 17, 127, 128, 129, 145, 148, 155, 156, 158, 161, 162, 163, 164, 168, 170, 174, 177, 178], "create_empty_arrai": [5, 13, 156], "create_grid": 174, "create_plot": 174, "create_se": 155, "create_shared_memori": [5, 13], "creation": [2, 4, 156, 161, 166], "creatur": 148, "criteria": [158, 159], "critic": [2, 17, 156], "critic_lay": 178, "critic_loss": 178, "critic_losses_moving_averag": 178, "critic_lr": 178, "critic_optim": 178, "critic_weight": 178, "critic_weights_path": 178, "cross": [151, 152, 153], "crucial": [5, 10, 158, 159, 161], "crypto": 148, "cstride": 174, "ctr_cost": 147, "ctrl_cost": [137, 138, 139, 140, 146, 147], "ctrl_cost_weight": [137, 138, 139, 140, 141, 146, 147, 170], "ctx": 13, "cube": 5, "cuda": [148, 178], "cum_reward": 175, "cumsum": 175, "cumul": [9, 14, 17, 20, 175], "cumulative_reward": 9, "cupi": [14, 17], "current": [2, 4, 7, 9, 10, 17, 18, 128, 148, 150, 151, 152, 153, 154, 155, 156, 158, 159, 163, 164, 166, 174, 175, 177, 178], "current_col": [151, 152, 153], "current_namespac": 4, "current_q": 164, "current_row": [151, 152, 153], "curriculum": 155, "curv": [155, 162], "custom": [2, 5, 10, 11, 12, 14, 15, 17, 18, 132, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 153, 155, 156, 158, 162, 164, 169, 171], "customis": 148, "customiz": 148, "customspaceerror": 13, "cut": [161, 164], "cvel": [140, 141], "cyaneu": 153, "cylind": 144, "cython": 156, "d": [7, 9, 15, 131, 148, 159, 172, 178], "dac": 148, "dacbench": [148, 156], "daemon": 11, "dag": 148, "dai": 126, "darkgrid": 177, "data": [5, 8, 9, 10, 15, 148, 155, 156, 158, 159, 162, 163, 164, 166, 168, 174, 175, 177, 178], "data_equival": 156, "data_equivil": 156, "databas": 2, "datafram": [175, 177], "datapoint": 8, "dataset": 156, "datatyp": 155, "david": 175, "davidpl1": 156, "davidslayback": 156, "de": 156, "dead": [155, 156], "deal": [6, 178], "dealer": [150, 155, 164, 174], "dealer_card": 164, "dealer_count": 174, "debug": [2, 5, 9, 148, 149, 155, 156, 158, 161, 162, 164], "decai": [164, 174], "decay_epsilon": [164, 174], "decent": [174, 177], "decid": [150, 156, 175], "decis": [148, 155, 156, 158, 159, 164, 167], "deck": [150, 164, 174], "declar": 159, "decomposit": 154, "decreas": [129, 163, 164, 175], "deep": [148, 155, 163, 167, 172, 175, 177, 178], "deepmind": [136, 155, 170], "def": [9, 14, 156, 159, 161, 164, 166, 168, 170, 174, 175, 177, 178], "default": [2, 4, 5, 6, 7, 9, 10, 11, 12, 13, 14, 15, 17, 18, 19, 128, 129, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 151, 152, 155, 156, 158, 159, 166, 167, 170], "default_camera_config": [136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147], "default_rng": 175, "defaultdict": [164, 174], "defin": [2, 3, 5, 8, 11, 12, 14, 15, 16, 17, 18, 135, 155, 156, 158, 159, 166, 167, 168, 175, 178], "definit": [137, 139, 140, 142, 155, 156, 167], "deform": 148, "deformable_gym": 148, "degre": [11, 140, 141, 142, 168, 178], "delai": [18, 20, 156, 166], "delayobserv": [18, 20, 156], "deleu": 156, "deliv": 154, "delta": [175, 177], "demand": 128, "demo": 1, "demonstr": [14, 127, 148, 162, 170, 178], "dennybritz": [151, 152], "denot": [2, 132, 153], "densiti": [144, 148, 156], "depend": [2, 6, 9, 10, 14, 18, 19, 126, 129, 130, 132, 136, 137, 138, 139, 140, 141, 146, 147, 153, 155, 156, 166, 175, 178], "dependencynotinstal": [9, 17], "deprec": [2, 136, 155, 156], "depreci": 155, "depth": 156, "depth_arrai": 136, "deque_s": [14, 17], "deriv": [137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 177], "derk": 148, "desc": [153, 175], "describ": [2, 5, 6, 7, 131, 132, 146, 150, 155, 156, 158, 168], "descript": [6, 20, 136, 156, 166], "design": [131, 140, 141, 148, 149, 154, 156, 164], "desir": [9, 14, 154, 159, 170, 178], "despit": 156, "destin": 154, "destroi": [129, 156], "detach": 178, "detail": [5, 6, 7, 9, 19, 131, 148, 155, 156, 158, 159, 161, 162, 164, 166, 170, 178], "detect": [156, 161, 166], "determin": [2, 17, 129, 131, 132, 133, 134, 135, 153, 155, 156, 158, 159, 166, 167, 170], "determinist": [16, 129, 131, 133, 134, 166, 178], "dev": [2, 155, 177], "develop": [136, 148, 155, 156, 161, 162, 164, 172, 177], "deviat": [146, 164, 177, 178], "devic": [14, 17, 156, 178], "devicearrai": 17, "dexter": 148, "dexteroushand": 148, "df1": 177, "di": 161, "diagnost": 2, "diagon": 159, "diagram": 135, "dict": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 18, 20, 136, 151, 152, 153, 154, 155, 156, 158, 159, 161, 166, 177], "dict_info": 14, "dict_kei": 18, "dict_time_kei": 18, "dictat": [128, 129], "dictinfotolist": [10, 14, 20, 156], "dictionari": [2, 5, 6, 7, 9, 10, 14, 18, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 155, 156, 158, 159, 166, 168, 174, 177], "did": [156, 167], "didn": [156, 175], "die": 128, "dietterich": 154, "differ": [2, 5, 6, 9, 11, 12, 16, 17, 18, 128, 135, 136, 147, 148, 155, 156, 158, 159, 161, 162, 164, 166, 167, 168, 170, 171, 173, 175, 176, 178], "differenti": 167, "difficult": [132, 136, 142, 143, 156, 159, 161, 163, 164, 175], "difficulti": [155, 159], "digit": 7, "dim": [140, 141], "dimens": [5, 7, 8, 18, 148, 156, 177], "dimension": [5, 17, 129, 137, 138, 139, 146, 147, 156, 158, 159, 166, 178], "direct": [6, 131, 132, 133, 134, 137, 138, 139, 140, 142, 143, 146, 147, 148, 151, 152, 153, 154, 159, 164, 166, 175, 177], "directli": [2, 6, 10, 15, 17, 131, 136, 158, 159, 166, 174, 177], "directori": [1, 155, 166], "dirhtml": 1, "disabl": [4, 17, 18, 19, 151, 152, 153, 155, 156, 164, 170], "disable_env_check": [4, 16, 17, 155], "disable_logg": 17, "disable_print": 4, "disable_render_order_enforc": [17, 155], "disallow": 154, "disc_to_cont": 168, "discard": 18, "discord": [148, 155, 156, 161, 172], "discount": [14, 19, 161, 164, 167, 174, 175, 177, 178], "discount_factor": [164, 174], "discourag": 155, "discov": [156, 170], "discret": [2, 5, 6, 7, 8, 11, 13, 18, 128, 129, 131, 132, 133, 134, 148, 149, 150, 151, 152, 153, 154, 155, 156, 158, 159, 164, 166, 168, 174], "discrete_act": 166, "discreteact": 168, "discreteenv": 155, "discuss": [155, 156, 159], "displac": [137, 138, 139, 140, 146, 147], "displai": [2, 4, 132, 155, 161, 166], "dissect": 175, "dist": 144, "distanc": [138, 139, 141, 144, 147, 159, 166], "distance_from_origin": [137, 140], "distance_penalti": 142, "distinct": [161, 167], "distinguish": [2, 159, 161, 166, 167], "distrib": 177, "distribut": [5, 6, 7, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 153, 155, 156, 170, 175, 177, 178], "dive": 158, "divers": [148, 157], "dlpack": 156, "do": [4, 7, 13, 15, 17, 128, 129, 131, 155, 156, 158, 159, 162, 164, 166, 168, 170, 175, 177, 178], "doc": [9, 129, 155, 156, 168], "dockerfil": 155, "docstr": [1, 155, 156], "doctest": 156, "document": [5, 7, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 126, 130, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 149, 155, 156, 158, 161, 166, 170, 174, 178], "doe": [2, 6, 8, 9, 10, 11, 12, 13, 15, 17, 18, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 150, 155, 156, 159, 166, 167, 168, 178], "doesn": [1, 2, 4, 15, 17, 129, 155, 156, 159, 167, 175], "dof": [137, 140, 141], "dog": 9, "doi": [154, 156], "domain": [16, 128, 131, 133, 134, 154, 168], "domain_random": 128, "don": [6, 14, 15, 128, 133, 155, 156, 158, 159, 161, 166, 167, 175, 178], "done": [2, 9, 14, 155, 156, 158, 160, 164, 166, 167, 170, 174, 175, 177, 178], "doom": 148, "dot": [6, 7, 166], "doubl": 136, "doublependulum": 142, "down": [5, 7, 128, 141, 148, 150, 151, 152, 153, 154, 156, 159, 164, 166, 167, 174, 175], "download": [166, 167, 168, 171, 174, 175, 177, 178], "downward": 131, "dramat": [155, 156], "draw": [6, 150, 164, 166, 174], "drawn": [6, 7, 144, 146, 150, 164], "drive": 128, "driver": 156, "drone": 148, "drop": [154, 156], "drryanhuang": 156, "dry": 159, "dsctt": 155, "dstack": 174, "dt": [137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 156, 170], "dtype": [2, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 16, 17, 18, 20, 129, 131, 132, 133, 134, 135, 155, 156, 159, 166, 175], "dtypeobserv": [14, 18, 20, 156], "dual": 148, "duburcqa": [155, 156], "duckietown": 148, "due": [2, 129, 132, 136, 153, 155, 156, 158, 161, 164, 167, 178], "dump": 156, "dunbar": 156, "dunder": 156, "duplic": [14, 156], "durat": [9, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 155, 162, 177], "dure": [2, 4, 6, 7, 10, 14, 17, 18, 19, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 154, 155, 156, 161, 166, 168, 170], "dw": 9, "dx": [137, 138, 139, 140, 146, 147], "dylwil3": 156, "dynam": [2, 16, 131, 135, 136, 142, 148, 155, 156, 159, 161], "e": [1, 2, 4, 5, 7, 8, 9, 11, 13, 14, 15, 17, 20, 129, 137, 138, 139, 140, 141, 143, 144, 145, 146, 147, 148, 150, 153, 155, 156, 159, 166, 168, 174, 175, 177, 178], "e3c16072f695": 170, "each": [2, 5, 6, 7, 9, 10, 11, 12, 13, 14, 16, 17, 18, 20, 126, 127, 128, 129, 130, 131, 132, 133, 134, 136, 137, 140, 141, 142, 143, 144, 145, 148, 149, 151, 152, 154, 155, 156, 158, 159, 161, 162, 164, 166, 174, 175, 178], "earli": [126, 162, 164, 174, 177], "earlier": [137, 140, 141, 166], "earliest": 177, "easi": [148, 149, 155, 158, 159, 175], "easier": [130, 155, 156, 158, 159, 178], "easiest": [128, 155, 156], "easili": [6, 10, 15, 148, 155, 156, 163], "east": 154, "ed": 131, "edg": [5, 6, 8, 132, 155, 156, 158, 159, 164], "edge_link": [6, 8], "edge_mask": 6, "edge_spac": [6, 8], "edgecolor": 174, "edit": [148, 155, 166], "educ": 162, "effect": [2, 8, 13, 15, 17, 129, 137, 141, 142, 143, 144, 145, 146, 154, 158, 159, 162, 174, 177], "effector": [144, 145], "effici": [11, 133, 134, 136, 148, 156, 159, 162, 163, 178], "effort": [130, 156], "eg": 166, "egl": 136, "eight": 137, "einforc": 177, "either": [7, 8, 9, 12, 14, 16, 17, 133, 134, 148, 150, 153, 154, 156, 158, 160, 161, 175, 177, 178], "ekalosak": [155, 156], "elaps": [14, 17], "elbow": 144, "electron": 148, "element": [2, 5, 6, 7, 10, 11, 13, 18, 132, 133, 134, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 156, 158, 166, 170, 177, 178], "elev": 170, "eleven": 136, "elf": 153, "elif": [159, 161], "elliottow": 156, "elo": 148, "els": [14, 18, 139, 147, 153, 154, 156, 159, 161, 164, 166, 174, 175, 178], "emb": 170, "embed": [162, 170], "emerg": [156, 162], "emit": 2, "emphas": 159, "emploi": 17, "empti": [5, 7, 13, 17, 137, 138, 139, 140, 141, 146, 147, 156, 159, 174, 175, 177], "emul": [155, 161], "en": [18, 177], "enabl": [4, 9, 17, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 128, 148, 155, 156, 161], "enable_wind": [129, 178], "encapsul": 2, "encod": [8, 148, 154, 155, 166], "encompass": 148, "encount": [161, 164, 178], "encourag": [155, 159, 170, 178], "end": [2, 3, 10, 14, 17, 127, 135, 136, 155, 156, 157, 158, 159, 161, 162, 164, 167, 170, 174, 175, 177, 178], "endeavor": 148, "energi": [127, 129, 132, 159, 168], "enforc": [4, 17, 155], "engin": [129, 136, 148, 156], "english": 7, "enough": [159, 170, 178], "ensur": [1, 2, 4, 6, 8, 9, 129, 148, 156, 158, 159, 162, 164, 166, 174], "ent_coef": 178, "enter": [2, 9, 129, 151, 152], "entir": [9, 17, 139, 147, 155, 156, 178], "entiti": 5, "entrain": 148, "entri": [4, 155, 156, 159, 164], "entropi": [2, 178], "entropy_moving_averag": 178, "entry_point": [4, 155, 159, 166], "entrypoint": 166, "enum": [4, 10, 156, 166], "enumer": 175, "env": [4, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 127, 128, 129, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 151, 152, 153, 154, 155, 156, 157, 158, 159, 160, 161, 162, 164, 167, 168, 170, 171, 174, 175, 176, 177], "env_check": [9, 155, 156, 159, 161], "env_devic": [14, 17], "env_fn": [11, 12], "env_id": [4, 156, 160, 161], "env_lambda": 9, "env_nam": [4, 160, 162], "env_new": 9, "env_old": 9, "env_spec": 156, "env_spec_kwarg": 156, "env_typ": 1, "env_xp": [14, 17], "envapicompat": 155, "envcompat": [155, 160], "envcreat": 4, "environ": [4, 5, 7, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 126, 127, 128, 129, 130, 131, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 149, 150, 151, 152, 153, 154, 155, 156, 157, 162, 167, 168, 169, 171, 172, 173, 176, 177], "environment_cr": 166, "environmentnam": 156, "envpool": [155, 156], "envs_wrapp": 178, "envspec": [2, 3, 4, 10, 15, 17, 156], "ep": [175, 177], "ep_action_log_prob": 178, "ep_reward": 178, "ep_value_pr": 178, "episod": [2, 4, 9, 10, 14, 17, 18, 20, 155, 156, 157, 158, 159, 161, 164, 166, 167, 170, 174, 175, 177, 178], "episode_data": 162, "episode_id": 9, "episode_index": 9, "episode_num": 162, "episode_ov": [158, 162], "episode_returns_moving_averag": 178, "episode_reward": [14, 19, 162, 164], "episode_tim": 162, "episode_trigg": [9, 17, 162], "episodestatisticsrecord": 156, "epoch": 178, "eprint": 156, "epsilon": [14, 18, 19, 164, 174, 175], "epsilon_decai": [164, 174], "epsilongreedi": 175, "equal": [11, 12, 129, 133, 134, 139, 144, 147, 150, 153, 154, 164, 175], "equat": [131, 135, 164], "equival": [4, 5, 8, 10, 14, 137, 140, 155, 156, 178], "erez": [139, 140, 141], "ericonaldo": 155, "error": [2, 4, 7, 8, 9, 11, 17, 20, 155, 156, 158, 164, 167, 174, 178], "errorr": 155, "escap": 2, "especi": [5, 161, 166, 168, 178], "essenti": [7, 162, 170], "estim": [19, 137, 161, 164, 167, 177, 178], "estimate_valu": 161, "et": [16, 17], "etc": [2, 5, 10, 14, 17, 137, 138, 139, 140, 146, 147, 155, 156, 158, 159, 161, 162, 166, 167, 168], "euclidean": [144, 145], "ev": 148, "ev2gym": 148, "eval": [162, 178], "eval_env": 161, "evalu": [14, 17, 18, 19, 148, 156, 161, 170, 174], "evanmath": 155, "even": [2, 4, 137, 139, 140, 142, 143, 147, 155, 159, 164, 166, 174], "event": [9, 155, 166], "eventu": [13, 158], "ever": [126, 155], "everi": [1, 5, 6, 9, 14, 17, 18, 19, 128, 129, 132, 137, 139, 140, 142, 143, 147, 156, 158, 159, 161, 166, 177, 178], "everyon": 136, "everyth": [17, 148, 158, 159], "evolv": 9, "exact": [150, 156, 174], "exactli": [8, 146, 158, 159, 162], "exampl": [1, 2, 6, 7, 8, 9, 10, 11, 12, 13, 14, 16, 17, 18, 19, 128, 131, 136, 148, 150, 151, 152, 153, 155, 156, 158, 162, 164, 166, 167, 168, 170, 171, 173, 174, 175, 176, 177, 178], "examplefuncenv": 156, "exce": [127, 150], "exceed": [2, 17, 20, 158, 174], "excel": 170, "except": [2, 7, 15, 155, 156, 159, 166], "exchang": 158, "excit": 156, "exclud": [4, 17, 20, 137, 138, 139, 140, 141, 142, 145, 146, 147, 154], "exclude_current_positions_from_observ": [137, 138, 139, 140, 141, 146, 147, 170], "exclude_namespac": 4, "exclus": [6, 136, 140, 141, 156], "execut": [1, 9, 16, 154, 158, 159, 166, 177, 178], "exhibit": 136, "exist": [2, 4, 5, 10, 11, 12, 15, 16, 17, 18, 19, 137, 138, 139, 140, 141, 143, 146, 147, 155, 156, 158, 162, 163, 178], "exit": [9, 10, 11, 12], "exp": 177, "expand": [5, 7], "expect": [2, 4, 5, 6, 7, 155, 156, 158, 159, 170, 175, 177, 178], "expens": [5, 155], "experi": [17, 136, 137, 140, 141, 142, 143, 148, 158, 159, 164, 174, 175, 177, 178], "experienc": 164, "experiment": [3, 131, 156], "explain": [155, 167], "explan": [174, 177], "explanatori": 174, "explicit": [156, 161], "explicitli": [3, 166, 167, 170], "exploit": [174, 175], "explor": [2, 5, 148, 156, 159, 163, 174, 175, 178], "explor_exploit_tradeoff": 175, "exponenti": [7, 14, 19, 20], "export": 156, "expos": [3, 148, 156], "express": [5, 9, 137, 140, 141], "ext_control": 6, "extend": [2, 17, 137, 156], "extens": [148, 156, 177], "extent": 153, "extern": [2, 137, 140, 141, 155, 156, 161, 167], "extra": [155, 156, 158, 166, 174], "extract": [9, 156, 175], "extrem": [148, 149], "ez": 155, "ezpickl": [4, 9, 15], "f": [153, 158, 159, 162, 164, 174, 175, 177, 178], "f_": [137, 140, 141], "face": [137, 140, 141, 150, 164, 174], "facecolor": 174, "facedown": 150, "facilit": 136, "fact": 177, "factor": [14, 19, 129, 174, 177, 178], "factori": 4, "fail": [156, 158, 161], "failur": [158, 159, 161, 162, 167], "fair": 7, "fairli": [155, 156, 177], "fall": [127, 140, 151, 152, 153, 158, 164, 167, 170, 175], "fallen": [139, 170], "fals": [4, 6, 9, 10, 11, 12, 14, 16, 17, 18, 19, 128, 129, 132, 137, 138, 139, 140, 141, 146, 147, 150, 154, 155, 156, 158, 159, 161, 162, 164, 166, 170, 174, 175, 177, 178], "familiar": 170, "familiaris": 159, "famou": 164, "far": [127, 128, 141, 142, 144, 145, 153, 158], "farama": [10, 11, 12, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 148, 156, 166, 172, 174, 177, 178], "fast": [128, 136, 138, 140, 142, 146, 148, 158, 161, 164], "faster": [127, 129, 137, 140, 141, 142, 145, 156, 164, 178], "fastest": 158, "favor": [2, 155, 156], "favorit": 174, "favour": [2, 155, 156, 160], "featur": [6, 7, 18, 136, 155, 156, 161, 178], "feature_spac": 6, "fed": 178, "feed": 178, "feedback": [156, 158, 159, 164], "feel": [170, 177], "feet": [138, 147], "fetchreach": 161, "few": [1, 131, 137, 138, 139, 140, 141, 143, 146, 147, 155, 156, 164, 170, 174, 175], "ffffffff": 153, "fffffhff": 153, "fffh": 153, "fffhffff": 153, "fffhfffg": 153, "ffoot": 138, "ffset": 177, "fhffhfhf": 153, "fhfh": 153, "fhhfffhf": 153, "fibonacci": 177, "fickl": [154, 156], "fickle_passeng": 154, "fidel": 148, "field": [156, 163], "fieteo": 155, "fig": [164, 174, 175, 178], "fig1": 174, "fig2": 174, "figaspect": 174, "fight": 148, "figsiz": [162, 164, 174, 175, 177, 178], "figur": [139, 156, 162, 174, 177], "file": [1, 131, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 155, 156, 162, 166, 170], "filenam": [9, 17, 162], "fill": 166, "filter": [14, 18, 20, 158], "filter_kei": [14, 18], "filterobserv": [14, 18, 20], "filterobservationwrapp": 18, "final": [3, 9, 18, 155, 156, 159, 162, 164, 166, 167, 170, 174], "final_epsilon": [164, 174], "final_info": [14, 17, 155, 156], "final_observ": [14, 17, 155, 156], "find": [2, 4, 156, 158, 162, 163, 164, 166, 170, 175], "find_highest_vers": 4, "fine": [166, 178], "finetun": 148, "finfo": 175, "fingertip": [144, 145], "finish": [2, 128, 129, 155, 156, 158, 162, 164, 166, 178], "finit": [6, 7, 137, 143, 147, 167, 168, 177], "fire": 129, "firefoxmetzg": 155, "firmwar": 148, "first": [2, 4, 6, 9, 10, 11, 12, 15, 129, 131, 133, 134, 137, 138, 139, 140, 141, 142, 145, 146, 147, 151, 152, 154, 155, 156, 157, 159, 161, 162, 164, 166, 174, 175, 177], "five": [130, 155, 164, 177], "fix": [5, 6, 7, 14, 17, 19, 20, 129, 131, 132, 135, 136, 137, 138, 139, 140, 142, 143, 144, 145, 147, 148, 150, 153, 155, 156, 158, 159, 161, 166, 177], "fixtur": 145, "flag": [11, 133, 136, 148, 161], "flake8": [155, 156], "flappi": 148, "flat": [5, 6, 7, 8, 170], "flatdim": [5, 8, 155], "flatt": 178, "flatten": [5, 8, 14, 18, 20, 136, 155, 156, 158, 159, 164, 166, 174, 175, 178], "flatten_spac": [5, 8], "flattenobserv": [6, 14, 18, 20, 158, 159, 166], "flesh": 3, "flex": 144, "flexibl": [11, 148, 156, 159], "flight": 148, "float": [4, 7, 8, 9, 14, 16, 17, 18, 19, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 159, 164, 166, 174, 175, 177, 178], "float32": [2, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 18, 127, 128, 129, 131, 132, 133, 134, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 156, 168], "float64": [5, 7, 8, 10, 14, 18, 19, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147], "flow": 148, "fluctuat": 164, "fluid": 146, "fly": [129, 161], "flycraft": 148, "fmt": 175, "fn": 13, "focu": [148, 159, 162, 178], "focus": [164, 172], "foddi": 148, "folder": [1, 9, 17, 156, 162], "follow": [1, 3, 4, 5, 9, 10, 14, 16, 17, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 129, 131, 132, 133, 134, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 150, 151, 152, 153, 154, 155, 156, 159, 166, 167, 168, 170, 174, 175, 177, 178], "fontsiz": [174, 175], "foot": [11, 138, 139, 140, 141, 147], "foot_joint": [139, 147], "foot_left_joint": 147, "forc": [15, 129, 132, 133, 134, 136, 137, 140, 141, 142, 143, 147, 155, 170, 177], "forcibli": 167, "forearm": [140, 141, 144], "forev": 167, "foreverska": 156, "forex": 148, "forg": 166, "forget": [14, 15, 158, 166], "forgot": 159, "fork": [1, 156, 157, 161], "form": [5, 6, 7, 17, 131, 146, 156, 166], "formal": 167, "format": [1, 4, 5, 9, 14, 156, 158, 159, 161, 162, 170], "formerli": 156, "forward": [13, 19, 127, 137, 138, 139, 140, 141, 146, 147, 155, 156, 177, 178], "forward_reward": [137, 138, 139, 140, 146, 147, 170], "forward_reward_weight": [137, 138, 139, 140, 146, 147, 170], "found": [20, 136, 142, 148, 155, 156, 174, 177], "foundat": [148, 156, 166, 172], "four": [128, 129, 137, 139, 148, 154, 156, 158, 159, 174], "foxik": 155, "fp": [2, 9, 10, 17, 129, 156, 166], "frac": [137, 138, 139, 140, 141, 146, 147], "frame": [2, 9, 10, 17, 18, 20, 128, 129, 144, 145, 155, 156, 162, 175], "frame_skip": [17, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 170], "framer": 166, "frameskip": 17, "frameskipobserv": 156, "framestack": [17, 18, 155, 156], "framestackobserv": [17, 18, 20, 156], "frametim": [137, 138, 139, 140, 141, 146, 147], "framework": [14, 17, 20, 136, 148, 156, 170], "franuka": 153, "free": [131, 135, 136, 137, 140, 141, 142, 143, 148, 170, 174, 177], "free_body_rot": 146, "freedom": [140, 141, 142, 168], "freejoint": [140, 141], "freez": [14, 18, 19], "frequenc": 17, "frequent": [155, 167], "friction": [127, 146, 147, 148], "frictionless": 132, "from": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 127, 128, 129, 131, 136, 137, 138, 139, 140, 141, 142, 144, 145, 146, 147, 148, 150, 151, 152, 153, 154, 155, 156, 158, 159, 161, 162, 163, 164, 167, 170, 174, 175, 177, 178], "from_json": [5, 156], "front": [137, 138, 146, 147], "front_left_leg": 137, "front_right_leg": 137, "frontpag": 156, "frozen": [149, 155, 156, 175], "frozen_lak": [153, 175], "frozenlak": [9, 153, 155, 156, 171, 172, 176], "frozenlake4x4": 156, "frozenlake8x8": [153, 155, 156], "frozenlake_q_learn": 175, "frozenset": 7, "fshin": 138, "fthigh": 138, "fuel": 129, "full": [3, 4, 128, 129, 155, 156, 158, 159, 174], "fulli": [2, 129, 137, 138, 139, 140, 141, 143, 146, 147, 148, 155], "fun": [174, 177], "func": [3, 14, 16, 18, 19, 156], "func_env": 3, "funcenv": [3, 156], "funcjaxenv": 156, "function": [2, 8, 10, 11, 12, 14, 16, 17, 18, 19, 20, 129, 132, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 153, 154, 155, 156, 158, 160, 164, 167, 168, 170, 172, 174, 175, 177, 178], "functional_jax_env": 3, "functionaljaxenv": 3, "fundament": [159, 162, 164, 165, 169, 171], "furcolor": 9, "further": [2, 5, 7, 129, 144, 145, 155, 156, 175, 177], "furthermor": [2, 9, 156, 158], "furthest": 127, "futur": [3, 155, 156, 161, 164], "future_q_valu": [164, 174], "g": [1, 2, 4, 5, 7, 8, 9, 11, 12, 13, 20, 131, 135, 137, 138, 139, 140, 141, 143, 146, 147, 148, 153, 154, 155, 156, 166, 168, 174, 175, 177, 178], "ga": 128, "gae": 178, "gaetanlepag": 156, "gain": [156, 168], "galleri": [1, 156], "game": [7, 9, 17, 126, 150, 151, 152, 153, 155, 156, 158, 159, 161, 164, 166, 174], "gamma": [14, 19, 161, 167, 175, 177, 178], "gap": 148, "garbag": [10, 11, 12, 17, 156], "gather": 166, "gaussian": 136, "gc_trigger": 17, "gcc": 148, "gen_gif": 1, "gen_md": 1, "gener": [1, 2, 3, 4, 5, 6, 7, 9, 10, 11, 12, 13, 15, 17, 127, 128, 129, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 150, 151, 152, 153, 154, 155, 156, 157, 159, 162, 163, 178], "generalis": [2, 10], "generate_random_map": [153, 175], "geometr": [6, 136], "geometri": 156, "get": [2, 4, 11, 12, 14, 15, 18, 19, 127, 129, 136, 137, 139, 140, 142, 150, 155, 156, 158, 159, 162, 166, 167, 170, 174, 175, 178], "get_act": [161, 164, 174], "get_attr": [11, 12, 156], "get_env_id": 4, "get_loss": 178, "get_moving_avg": 164, "get_rect": 166, "get_stat": 155, "get_wrapper_attr": [15, 156], "gianluca": 156, "gianlucadecola": [155, 156], "giant": 164, "gif": [1, 131, 156], "git": [166, 170], "github": [19, 129, 132, 136, 137, 139, 140, 141, 142, 143, 144, 145, 147, 151, 152, 155, 156, 161, 166, 170, 172], "give": [2, 10, 129, 137, 150, 154, 155, 158, 159, 174, 177, 178], "given": [3, 4, 5, 7, 16, 127, 129, 130, 131, 132, 133, 134, 137, 139, 140, 142, 143, 147, 155, 156, 167, 174], "glfw": 136, "global": 4, "gnn": 148, "go": [2, 9, 128, 148, 150, 155, 159, 163, 164, 167, 170, 174, 177, 178], "go1": 170, "goal": [2, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 150, 151, 152, 153, 154, 159, 161, 164, 166, 177], "goal_slidei": 144, "goal_slidex": 144, "goal_veloc": [133, 134], "godsboy404": 156, "goe": [150, 155, 164], "gone": 155, "good": [158, 159, 164, 174, 175, 178], "googl": [155, 170], "goul\u00e3o": 156, "gp": 148, "gpu": [136, 148, 156, 163, 178], "gracefulli": 155, "gradient": [177, 178], "gradual": [158, 162, 164], "grai": 17, "grammat": 156, "grant": 129, "graph": [5, 6, 8, 13, 148, 155, 156, 158, 174, 178], "graphic": [136, 155], "graphinst": [6, 8, 13, 155, 156], "grasp": 148, "grave": 178, "gravit": 129, "graviti": [129, 132, 133, 135, 142, 143, 148, 177, 178], "grayscal": [14, 17, 18, 20], "grayscale_env": 18, "grayscale_newaxi": 17, "grayscale_ob": 17, "grayscaleobserv": [14, 18, 20], "great": [148, 168, 174], "greater": [129, 131, 132, 133, 134, 143, 150, 174], "greedi": [164, 174, 175], "greedili": 174, "green": [131, 154], "grei": 174, "greyscal": 17, "grid": [148, 151, 152, 153, 154, 159, 162, 166, 174], "grid_world": 166, "gridlin": 166, "gridworld": [2, 148, 151, 152, 158, 166], "gridworldenv": [159, 166], "griesbach": 156, "grip": 174, "ground": [127, 129, 141, 148], "group": [129, 155], "grow": 162, "gt": [155, 156], "guarante": [5, 6, 13, 17, 148, 172], "guess": 155, "guid": [148, 156, 159, 170], "guidelin": 17, "guyazran": 156, "gym": [2, 5, 8, 9, 10, 11, 12, 14, 15, 16, 17, 18, 19, 126, 127, 128, 129, 131, 132, 133, 134, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 150, 151, 152, 153, 154, 156, 157, 158, 159, 161, 162, 164, 166, 167, 168, 170, 174, 175, 177, 178], "gym4real": 148, "gym_compat": 161, "gymenv": 160, "gymfc": 148, "gymlibrari": 155, "gymnasium": [2, 3, 4, 5, 6, 7, 8, 9, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 126, 127, 128, 129, 130, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 150, 151, 152, 153, 154, 157, 159, 160, 161, 162, 163, 164, 167, 170, 173, 174, 175, 176, 177, 178], "gymnasium_env": [159, 166], "gymnasium_robot": [136, 156, 161], "gymnax": 148, "gymv21compat": 156, "gymv21environ": [160, 161], "gymv22compat": 156, "gymv22environ": 156, "gymv26environ": 160, "gyroscop": 128, "h": 153, "h5": 178, "ha": [1, 2, 4, 5, 7, 8, 9, 10, 13, 14, 15, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 127, 128, 129, 130, 131, 132, 133, 134, 135, 136, 137, 139, 140, 141, 144, 145, 146, 148, 150, 154, 155, 156, 157, 158, 159, 161, 164, 166, 167, 170, 174, 175, 177, 178], "hacki": 13, "had": [2, 155, 156], "half": 136, "half_cheetah": 138, "halfcheetah": [14, 136, 138], "halt": 167, "hand": [148, 150, 164, 177], "handl": [5, 10, 11, 12, 142, 150, 155, 156, 158, 161, 164, 169, 171, 174], "handling_time_limit": 167, "hang": [13, 131, 155], "hannah": 156, "happen": [133, 134, 137, 139, 140, 142, 143, 147, 150, 153, 154, 155, 156, 158, 159, 164, 167], "haracterist": 177, "hard": [156, 159, 161, 175], "hardcor": 127, "harden": [155, 156], "harder": [129, 170], "hardwar": [148, 155, 156], "harlei": 178, "harm": 174, "hasattr": 156, "hash_se": 155, "hasn": 161, "hasselmo": 131, "hatchl": 166, "have": [2, 4, 5, 7, 8, 10, 11, 13, 14, 15, 16, 17, 18, 126, 127, 128, 131, 137, 140, 141, 142, 143, 144, 145, 147, 150, 153, 154, 155, 156, 158, 159, 160, 161, 164, 166, 167, 168, 170, 174, 175, 177, 178], "haven": 17, "head": [11, 138, 161], "headless": [136, 155], "healthi": [137, 139, 140, 142, 143, 147], "healthy_angle_rang": [139, 147], "healthy_reward": [137, 139, 140, 142, 143, 147, 170], "healthy_state_rang": 139, "healthy_z_rang": [137, 139, 140, 147, 170], "heart": [158, 164], "heatmap": [174, 175], "height": [131, 136, 137, 139, 140, 142, 147, 155, 156, 170], "held": 150, "hello": 7, "help": [2, 4, 5, 9, 155, 156, 158, 162, 165, 169, 171, 174, 178], "helper": [155, 159], "helpingstar": 156, "henc": [137, 149, 177], "here": [3, 9, 131, 137, 140, 155, 156, 159, 162, 164, 166, 170, 178], "heurist": [127, 129, 148, 156], "hffg": 153, "hidden": [2, 177], "hidden_space1": 177, "hidden_space2": 177, "hierarch": [5, 154], "high": [2, 6, 7, 8, 11, 12, 13, 14, 18, 131, 132, 134, 135, 137, 148, 155, 156, 158, 164, 168, 170, 178], "higher": [19, 127, 144, 164, 170, 178], "highest": [4, 164], "highli": [5, 9, 126, 130, 148, 155, 166], "highwayenv": [148, 156], "hill": [133, 134], "hing": [137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147], "hinge2": 142, "hint": [155, 156], "hinter": 155, "hip": [127, 137, 140, 141], "hip_1": 137, "hip_2": 137, "hip_3": 137, "hip_4": 137, "histor": [148, 159], "histori": 136, "histplot": 175, "hit": [150, 158, 159, 164, 174], "hold": [5, 150, 174], "hole": [153, 175], "homepag": 156, "hood": 156, "hook": [155, 156], "hooper": 156, "hop": [136, 139, 147], "hope": 156, "hopefulli": [155, 174], "hopper": [15, 16, 136, 147, 156], "hopper_v4": 15, "hopperenv": 15, "horizon": [9, 139, 148, 167], "horizon_timestep": 9, "horizont": [127, 129, 131, 159, 166], "host": 156, "hot": 8, "hotter": 155, "hour": 162, "hous": 164, "how": [2, 5, 6, 9, 11, 12, 14, 141, 142, 144, 145, 148, 156, 158, 159, 161, 162, 164, 166, 167, 168, 172, 174, 178], "howardh": 156, "howev": [2, 5, 6, 7, 8, 9, 10, 11, 13, 16, 17, 131, 137, 138, 139, 140, 141, 145, 146, 147, 155, 156, 158, 166, 167, 168, 174, 178], "hpo": 172, "html": [18, 177], "http": [1, 2, 10, 11, 12, 18, 19, 128, 131, 150, 151, 152, 153, 155, 156, 166, 170, 174, 175, 177, 178], "hue": 175, "huge": [148, 155], "hull": 127, "human": [2, 6, 9, 17, 20, 128, 136, 140, 141, 144, 148, 155, 156, 157, 158, 159, 160, 161, 166, 170, 178], "humanoid": [136, 156, 170, 172], "humanoidstandup": [136, 141], "humanoidstandup_v4": 155, "humanrend": [17, 20, 156], "humnaoid": 170, "hundr": 162, "hundredth": 17, "hyperparam": 178, "hyperparamet": [162, 164, 172, 174, 175, 177, 178], "i": [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 126, 127, 128, 129, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 150, 151, 152, 153, 154, 155, 156, 157, 159, 160, 161, 162, 163, 164, 165, 166, 167, 168, 169, 170, 171, 173, 174, 175, 176, 177, 178], "i_": [137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147], "ianyfan": 156, "ic": 153, "ice1187": 155, "iclr": 178, "icml": 178, "icu": 148, "id": [4, 17, 136, 137, 140, 141, 153, 156, 159, 166], "idea": [158, 167, 174], "ident": [7, 11, 12, 136, 156], "identifi": [155, 162], "idx": 175, "if__name__": 178, "iff": [9, 17, 166], "iforce2d": 128, "igibson": 148, "ignor": [1, 9, 150, 155, 161, 164, 174], "ikamensh": [155, 156], "illeg": 154, "illustr": [14, 166, 167], "im": 143, "imag": [2, 5, 10, 11, 12, 14, 17, 18, 20, 128, 136, 156, 158, 170], "imagesequenceclip": 9, "imagin": [148, 158, 168], "immedi": [9, 19, 20, 137, 139, 140, 141, 147, 150, 158, 159, 164, 166], "immut": 5, "impact": [141, 161, 175], "impact_cost": 141, "impact_cost_rang": 141, "impact_cost_weight": 141, "implement": [5, 6, 9, 10, 15, 16, 17, 20, 129, 132, 135, 142, 148, 149, 155, 156, 158, 159, 160, 161, 162, 164, 165, 166, 169, 171, 172, 173, 176, 177, 178], "implementing_custom_wrapp": 168, "implic": 161, "implicitli": 178, "import": [2, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 127, 128, 129, 131, 132, 133, 134, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 150, 151, 152, 153, 154, 155, 156, 157, 158, 159, 160, 161, 162, 164, 166, 168, 170, 175, 177, 178], "importantli": [15, 156, 158], "importerror": 156, "imposs": [159, 164], "improv": [11, 155, 156, 158, 161, 162, 163], "imshow": 175, "inaccur": 164, "includ": [2, 4, 14, 17, 18, 20, 132, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 154, 155, 156, 158, 159, 160, 162, 166, 167, 170, 172], "include_cfrc_ext_in_observ": [137, 140, 141, 170], "include_cinert_in_observ": [140, 141], "include_cvel_in_observ": [140, 141], "include_qfrc_actuator_in_observ": [140, 141], "inclus": [137, 155], "incompleteidea": [150, 151, 152], "inconsist": 161, "incorpor": 148, "incorrect": [154, 155, 156, 159, 161, 167], "incorrectli": [19, 156], "increas": [129, 131, 132, 136, 139, 144, 146, 147, 156, 163, 164, 174, 175, 178], "incur": [131, 151, 152, 154], "independ": [6, 7, 10, 129, 139, 146, 147, 156], "index": [1, 6, 9, 13, 14, 17, 18, 20, 132], "indic": [2, 9, 14, 17, 128, 131, 132, 150, 151, 152, 153, 154, 155, 164, 167, 174, 175, 177], "individu": [2, 11, 12, 137, 138, 139, 140, 141, 142, 144, 145, 146, 147, 155, 159, 166, 168, 177], "indoril007": 155, "induc": [137, 138, 139, 140, 141, 146, 147], "induct": [137, 138, 139, 140, 141, 146, 147], "ineffici": [156, 163], "inelast": [133, 134], "inertia": [140, 141], "inf": [2, 10, 16, 18, 132, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 156, 158, 168, 170], "infam": 174, "infeas": 7, "infer": [7, 155], "infinit": [16, 17, 18, 129, 139, 150, 155, 156, 158, 159, 164, 167, 174], "info": [2, 3, 9, 10, 11, 12, 14, 17, 18, 19, 20, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 154, 155, 156, 157, 158, 159, 161, 162, 164, 166, 167, 168, 170, 174, 175, 177, 178], "inform": [1, 2, 5, 6, 7, 9, 10, 11, 12, 18, 20, 127, 128, 129, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 155, 156, 158, 159, 161, 164, 166, 167, 170, 174, 177], "infti": [7, 139], "inher": 167, "inherit": [4, 5, 15, 16, 18, 19, 155, 156, 159, 166], "init": [128, 159, 162, 166, 178], "initi": [2, 3, 4, 6, 7, 9, 10, 14, 15, 16, 17, 18, 19, 127, 129, 130, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 150, 151, 152, 153, 154, 155, 159, 162, 164, 168, 170, 174, 175, 177, 178], "initial_epsilon": [164, 174], "initial_sampl": 156, "initialis": [2, 4, 10, 17, 150, 156, 157], "inlin": 178, "inner": 11, "inner_st": 6, "inplac": 177, "input": [9, 10, 156, 158, 159, 174, 178], "inregular": 17, "insert": [157, 177], "insid": [1, 6, 7, 17, 148, 154, 159, 166], "insight": [148, 158, 164], "inspect": 9, "inspir": [151, 152, 156, 175], "instabl": [163, 164], "instal": [1, 9, 17, 126, 130, 136, 155, 156, 158, 166, 170], "instanc": [2, 3, 4, 5, 6, 8, 9, 10, 11, 13, 17, 18, 156, 158, 159, 163, 168, 178], "instanti": [9, 14, 17, 18, 19, 166, 175], "instead": [2, 10, 11, 14, 15, 127, 131, 137, 140, 147, 155, 156, 158, 159, 161, 162, 164, 166, 178], "institut": [133, 134], "instruct": [136, 148, 156, 166], "insuffici": 164, "int": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 136, 137, 150, 151, 152, 153, 154, 156, 159, 164, 166, 174, 175, 177, 178], "int23": 17, "int32": [6, 8, 10, 14, 18, 159], "int64": [6, 7, 8, 156, 159], "int8": [5, 7], "int_32": 17, "integ": [2, 6, 7, 8, 9, 14, 16, 17, 18, 155, 156, 159, 166], "integr": [9, 156, 170], "intellig": [154, 155, 158, 164], "intend": [3, 14, 17, 148, 151, 152, 153, 154, 172, 175], "intens": 148, "interact": [5, 9, 14, 17, 20, 148, 158, 159, 164, 166, 174, 178], "interest": [18, 156, 162, 170], "interestingli": 175, "interfac": [9, 156, 157, 158], "interlink": 158, "intermedi": [140, 141, 159], "intermitt": 17, "intern": [2, 3, 10, 155, 156, 159, 161, 162], "internet": 148, "interoper": 148, "interv": [7, 137, 139, 140, 147, 162], "intrins": 168, "introduc": [137, 140, 141, 148, 155, 156, 160, 161], "introduct": [131, 150, 151, 152, 160, 175], "introductori": 156, "invalid": [2, 7, 156, 159, 170, 174], "invers": 4, "invert": [135, 136, 177], "inverted_double_pendulum": 142, "inverted_pendulum": [143, 177], "inverteddoublependulum": [136, 142], "invertedpendulum": [136, 143, 177], "investig": 156, "involv": [6, 126, 142, 148, 151, 152, 153, 154, 155, 156, 166, 177], "io": [18, 148, 153], "ipynb": [166, 167, 168, 170, 174, 175, 177, 178], "irrelev": 159, "irrespect": 9, "is_avail": 178, "is_bound": 7, "is_np_flatten": [5, 156], "is_rain": 154, "is_raini": 154, "is_slipperi": [151, 152, 153, 156, 175], "is_slippi": 156, "is_vector_env": 9, "isaac": 148, "isinst": 156, "isn": [6, 9, 156, 159, 162], "isort": 156, "issu": [17, 18, 129, 132, 136, 137, 139, 140, 141, 142, 143, 144, 145, 147, 155, 156, 161, 162, 166], "itch": 153, "item": [9, 13, 18, 174, 175, 178], "iter": [5, 6, 12, 13, 156, 159], "itomori": 148, "its": [2, 9, 16, 17, 129, 135, 136, 137, 139, 141, 144, 147, 148, 156, 158, 161, 175, 177, 178], "itself": [3, 8, 10, 11, 12, 15, 17, 155, 156, 158, 159, 160, 178], "j": [156, 177, 178], "jack": 150, "jair": 154, "jamartinh": 156, "jax": [2, 14, 17, 20, 148, 156, 163], "jax_to_numpi": 156, "jaxenv": [14, 17], "jaxtonumpi": [14, 17, 20, 156], "jaxtotorch": [14, 17, 20, 156], "jessefarebro": 155, "jet": 156, "jfpettit": 155, "jimini": 148, "jin": 156, "jit": 163, "jjshoot": [155, 156], "jkterry1": 155, "jnp": 17, "job": [148, 166], "job_statu": 6, "john": 156, "johnminelli": 155, "johnnycode8": 172, "join": [5, 156], "joint": [127, 129, 131, 132, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147], "joint0": 145, "joint1": 145, "jordan": [137, 156, 178], "journal": 154, "journei": [155, 174], "json": 156, "json_env_spec": 156, "jsonabl": 5, "jump": 170, "jumpi": 156, "jun": 156, "junk": 14, "jupyt": [1, 155, 166, 167, 168, 170, 171, 174, 175, 177, 178], "just": [3, 13, 15, 143, 145, 155, 156, 158, 159, 161, 163, 164, 166, 170, 178], "k": [8, 9, 14, 129, 146, 156, 178], "kad99kev": 156, "kalli": 170, "kallinteri": [156, 170], "karp": 178, "kavukcuoglu": 178, "kde": 175, "keep": [9, 14, 17, 18, 20, 132, 141, 143, 159, 164, 166], "keep_dim": [14, 18], "kei": [2, 4, 5, 6, 7, 9, 10, 14, 17, 18, 20, 137, 138, 139, 140, 141, 146, 147, 151, 152, 153, 154, 155, 156, 158, 164, 166, 167, 168, 174, 175], "kellycoinflip": 155, "kept": [10, 136, 170], "kerajli": 156, "kexianshen": 155, "key_to_act": 9, "keyb0ardninja": 156, "keyboard": [7, 9, 155], "keys_to_act": [9, 155, 178], "keyword": [4, 6, 10, 11, 12, 14, 131, 132, 150, 155, 156, 158, 166, 174], "kg": [155, 156], "khoda81": 156, "kind": 7, "king": 150, "kir0ul": [155, 156], "klimov": [126, 127, 128, 129], "knee": [127, 140, 141], "know": [2, 156, 158, 159, 161, 163, 164, 166], "knowledg": [4, 164], "known": [2, 164], "krimmel": 156, "kvrban": 156, "kwarg": [3, 4, 9, 10, 11, 12, 14, 15, 137, 138, 139, 140, 146, 147, 156, 160, 166], "kwiatkowski": 156, "l": [14, 17, 146, 156, 162], "l2r": 148, "lab_black": 175, "label": [162, 174, 175], "laboratori": 148, "lack": 156, "ladder": 127, "lai": 141, "lake": [149, 155, 156], "lam": 178, "lambaactionv0": 156, "lambda": [11, 12, 14, 16, 17, 18, 19, 156, 162, 164, 174, 178], "lambdaact": 14, "land": 129, "lander": [126, 155, 156], "lane": 148, "lap": [128, 155], "lap_complete_perc": 128, "larg": [11, 129, 134, 137, 138, 139, 140, 141, 144, 145, 146, 147, 148, 155, 156, 163, 164, 168, 170, 175], "larger": [164, 178], "largest": 155, "last": [9, 13, 14, 17, 18, 20, 141, 144, 145, 155, 156, 162, 166, 167, 175], "latent": 148, "later": [129, 158, 159, 162, 164, 174, 177, 178], "latest": [2, 163, 177], "latin": 7, "latter": [151, 152], "lava": 2, "layer": [3, 15, 158, 159, 177], "lazili": 5, "lazyfram": 18, "lead": [161, 178], "learn": [2, 5, 6, 17, 18, 19, 127, 128, 129, 131, 132, 133, 134, 138, 142, 143, 146, 148, 149, 150, 151, 152, 154, 155, 156, 157, 162, 163, 166, 170, 171, 172, 176, 178], "learner": 175, "learning_r": [164, 174, 175, 177], "learnt": 4, "least": [7, 129, 136], "leav": [132, 142, 166, 175], "left": [7, 127, 128, 129, 132, 133, 137, 140, 141, 142, 143, 147, 151, 152, 153, 154, 158, 159, 166, 170, 174, 175, 177], "left_elbow": [140, 141], "left_elfbow": [140, 141], "left_foot": [140, 141], "left_hip_i": [140, 141], "left_hip_x": [140, 141], "left_hip_z": [140, 141], "left_hiz_z": [140, 141], "left_kne": [140, 141], "left_lower_arm": [140, 141], "left_shoulder1": [140, 141], "left_shoulder2": [140, 141], "left_sin": [140, 141], "left_thigh": [140, 141], "left_upper_arm": [140, 141], "leg": [127, 129, 137, 139, 140, 141, 147], "leg_joint": [139, 147], "leg_left_joint": 147, "legaci": 155, "legend": [162, 174, 175], "legend_el": 174, "len": [6, 17, 162, 164, 168, 174, 178], "length": [4, 6, 7, 9, 11, 12, 14, 17, 20, 127, 131, 132, 133, 134, 146, 148, 153, 154, 155, 156, 158, 162, 164, 174, 178], "length_mask": 6, "length_moving_averag": [164, 174], "length_queu": [14, 17, 162, 164, 174], "leq": 142, "less": [127, 129, 146, 147, 158, 164, 175], "lesson": 175, "let": [148, 156, 158, 159, 164, 166, 168, 174, 175, 177], "letter": [153, 154, 155], "level": [9, 15, 158, 162, 170], "levin": [137, 178], "lg": 156, "li": [141, 156], "lib": [151, 152], "librari": [148, 156, 157, 161, 166, 170], "licens": [155, 156, 166, 174, 175, 177, 178], "lidar": 127, "life": [17, 155, 156, 177], "lift": 144, "light": 148, "lighter": 156, "lightgreen": 174, "lightli": 161, "lightweight": [148, 162], "ligibl": 177, "like": [3, 5, 7, 9, 13, 14, 15, 16, 17, 18, 19, 20, 138, 143, 147, 148, 154, 155, 156, 158, 159, 162, 164, 166, 168, 170, 172, 178], "lillicrap": 178, "limit": [17, 20, 132, 143, 155, 156, 158, 159, 161, 163, 164, 169, 171, 174, 177, 178], "lin826": 155, "linalg": [9, 159, 166], "line": [2, 5, 131, 155, 156, 159, 166], "linear": [10, 129, 131, 142, 143, 146, 177, 178], "linearli": [14, 16, 18, 20, 131, 142, 143, 177], "linecolor": 175, "lineplot": [175, 177], "linewidth": [162, 174, 175], "link": [21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 131, 137, 145, 146, 156, 166], "linux": 156, "list": [2, 4, 5, 6, 7, 9, 10, 11, 12, 14, 15, 17, 18, 155, 156, 158, 159, 162, 174, 175, 178], "list_info": 14, "listdir": 17, "liter": 156, "littl": [129, 156, 159, 164], "live": [1, 9, 159, 174], "ll": [155, 158, 159, 162, 164, 174, 178], "llvm": 148, "load": [4, 155, 156, 169, 171], "load_env_cr": 4, "load_ext": 175, "load_quadruped_model": 170, "load_state_dict": 178, "load_weight": 178, "loc": [154, 178], "local": 166, "localhost": 1, "locat": [4, 136, 148, 151, 152, 153, 154, 159, 166], "log": [2, 9, 14, 16, 17, 18, 19, 162, 175, 177, 178], "log_prob": [177, 178], "logan": 156, "logger": [17, 155], "logic": [11, 128, 155, 156, 159, 164, 166, 170], "logical_or": 156, "logit": 178, "long": [7, 9, 17, 132, 143, 148, 155, 156, 159, 162, 164], "longer": [2, 136, 137, 139, 143, 147, 155, 156, 161, 177], "look": [5, 9, 17, 158, 161, 162, 166, 167, 168, 175, 178], "loop": [148, 161, 174, 178], "lose": [129, 150, 164, 174], "loss": [17, 150, 164, 177, 178], "lost": 17, "lot": [15, 164, 168, 174, 177], "low": [2, 6, 7, 8, 12, 13, 14, 18, 131, 132, 134, 135, 155, 156, 164, 168, 178], "lower": [7, 14, 15, 19, 20, 140, 141, 155, 158, 164, 174, 178], "lower_waist": [140, 141], "lpizzinidev": 156, "lr": [161, 164, 174, 175, 177, 178], "lt": [155, 156], "lucasalegr": 156, "lunar": [126, 155, 156], "lunar_land": [129, 156], "lunarland": [17, 129, 155, 156, 157, 161, 164, 178], "lunarlandercontinu": 168, "lwaist": [140, 141], "lz4": 18, "m": [8, 131, 133, 134, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 155, 170, 178], "mab": 148, "machado": [16, 17], "machin": [155, 175, 177], "made": [1, 129, 137, 138, 139, 140, 141, 143, 146, 147, 155, 156, 161, 170, 172, 178], "magnitud": [9, 129, 134, 142, 143, 177], "mahiuchun": 155, "mai": [2, 5, 7, 8, 9, 11, 14, 15, 16, 18, 19, 151, 152, 153, 158, 161, 166, 170, 178], "main": [2, 129, 139, 147, 156, 161, 170, 175], "main_bodi": [137, 170], "mainli": [137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147], "maintain": [136, 148, 155, 156, 157, 161, 172], "mainten": 155, "major": [155, 156], "make": [1, 2, 6, 9, 11, 12, 15, 16, 17, 18, 19, 127, 128, 129, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 150, 151, 152, 153, 154, 155, 156, 157, 158, 160, 161, 162, 164, 168, 169, 170, 171, 174, 175, 177, 178], "make_dict": 14, "make_vec": [2, 4, 9, 10, 11, 12, 14, 132, 156, 159, 163, 178], "malici": 156, "manag": [4, 13, 148, 164], "mandatori": [159, 166], "manhattan": [159, 166], "mani": [7, 14, 17, 136, 148, 155, 156, 159, 161, 164, 166, 174, 175], "manipul": 148, "manner": [3, 7, 18, 20, 155], "mantasu": 156, "manual": [9, 14, 158, 178], "manual_se": 177, "manuel": 156, "manufactur": 170, "map": [9, 14, 17, 153, 154, 156, 158, 159, 164, 166, 174, 177], "map_nam": 153, "map_siz": 175, "mar": [148, 156], "mariojerez": 156, "marionj": 156, "mark": 156, "markdown": 1, "market": 148, "markov": [148, 156, 158, 167], "markovian": 148, "marku": 156, "markus28": [155, 156], "marsexplor": 148, "mask": [5, 6, 7, 148, 154, 155, 156, 178], "mass": [129, 137, 140, 141, 146], "massiv": 155, "master": [18, 151, 152, 155, 158, 177], "match": [4, 8, 11, 12, 16, 132, 156], "math": [135, 148, 155, 164], "mathbb": 7, "mathcal": [137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147], "mathemat": [5, 158, 177], "matplotlib": [9, 162, 164, 174, 175, 177, 178], "matpoliquin": 156, "matric": [5, 148], "matrix": [6, 140, 141, 148], "matter": [7, 155, 159, 161], "matyasch": 156, "max": [4, 7, 14, 16, 17, 18, 20, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 153, 156, 161, 164, 174, 175, 177, 178], "max_a": 167, "max_act": [14, 15, 16, 20], "max_episode_step": [4, 17, 156, 159, 166, 170, 178], "max_geom": 136, "max_id": 175, "max_length": 7, "max_ob": [14, 18, 20], "max_reward": [10, 14, 19, 156, 168], "max_time_step": [132, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147], "maxandskipenv": 18, "maxandskipobserv": [18, 20, 156], "maxim": [159, 164, 177, 178], "maximis": 163, "maximum": [4, 7, 9, 14, 17, 18, 20, 129, 131, 135, 142, 156, 158, 164, 166, 175, 178], "maxq": 154, "mayb": [2, 175], "maze": 159, "mclean": 156, "md": [1, 155, 156, 166], "mdp": [2, 17, 133, 134, 148, 158], "mean": [2, 14, 18, 19, 20, 131, 139, 144, 155, 156, 164, 166, 175, 177, 178], "meaning": 164, "meant": 3, "meantim": 156, "measur": [9, 127, 135, 141, 142, 144, 145, 155, 159], "mechan": 156, "medium": 148, "mel": 153, "melbourn": 175, "melt": 177, "member": 5, "memori": [5, 17, 133, 134, 155, 156, 162, 163], "menageri": 170, "mention": [156, 177], "menu": 158, "mere": 166, "merg": 156, "meshcat": 148, "meshgrid": 174, "messag": [5, 155, 156, 162], "meta": [148, 155], "metaclass": 155, "metadata": [2, 3, 9, 10, 15, 17, 155, 156, 166, 168], "metatrad": 148, "metaworld": 148, "meter": [135, 148], "meth": [7, 17], "method": [3, 4, 6, 9, 14, 16, 17, 18, 19, 148, 155, 156, 159, 160, 161, 164, 166, 168, 177, 178], "methodologi": 148, "metric": [2, 9, 156, 162, 178], "mgoulao": 156, "micim": 155, "microgrid": 148, "mid": 161, "middl": [139, 147, 164], "might": [2, 5, 7, 8, 15, 16, 158, 159, 163, 166, 168, 174, 177, 178], "migrat": [136, 156], "mihaic": 156, "mileston": 162, "miller": 175, "min": [7, 14, 16, 131, 132, 133, 134, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147], "min_act": [14, 15, 16, 20], "min_length": 7, "min_ob": [14, 18, 20], "min_reward": [10, 14, 19, 156, 168], "minari": 148, "minatari": 148, "mind": 156, "mine": 148, "minecraft": 148, "minesweep": 148, "minetest": 148, "miniatur": 148, "minibatch": 178, "minigrid": [148, 156], "minim": [2, 148, 156, 159, 166, 167, 175, 178], "minimalist": 148, "minimum": [7, 14, 18, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 158, 159, 164, 175], "miniwob": 148, "miniworld": 148, "minor": [155, 156], "mirza": 178, "misc": [155, 156], "mischapanch": 156, "miss": [131, 154, 155, 156, 158, 159, 162], "mission": 5, "mistak": [156, 158, 159], "mit": [131, 174, 175, 177, 178], "mitig": 178, "mixtur": 156, "mj_camera": [137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147], "mj_step": [137, 140], "mjcf": 170, "mjdata": 136, "mjtvisflag": 136, "mjvcamera": 136, "mjvis_contactforc": 136, "mjvis_contactpoint": 136, "mjvisual": 136, "mkdir": 178, "ml": [148, 155], "mmcaulif": 156, "mnih": 178, "mo": 148, "moba": 148, "mobil": 148, "modal": 136, "mode": [2, 4, 10, 11, 12, 14, 155, 156, 158, 162, 164, 166, 174, 178], "model": [137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 156, 159, 161, 172, 174], "modern": [148, 161], "modif": 168, "modifi": [2, 4, 5, 10, 14, 15, 16, 18, 19, 20, 131, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 154, 155, 156, 159, 166, 168], "modul": [4, 5, 13, 155, 156, 166, 168, 177, 178], "modular": [14, 15, 148, 158, 166, 168], "module_nam": 156, "moduletyp": [14, 17], "mojoco": 172, "moment": 3, "monitor": [17, 155, 156, 162], "monop": 136, "mont": [164, 174, 177, 178], "month": 156, "moon": 129, "moor": [133, 134], "moore90efficientmemori": [133, 134], "more": [1, 2, 5, 6, 7, 10, 11, 12, 14, 15, 16, 19, 20, 127, 129, 136, 137, 140, 141, 142, 143, 144, 145, 146, 147, 148, 155, 156, 158, 159, 161, 163, 164, 166, 167, 168, 170, 174, 175, 177, 178], "moreov": [5, 14, 15, 17, 166, 168], "moritz": [137, 178], "most": [2, 5, 7, 13, 14, 15, 17, 18, 136, 145, 148, 155, 156, 158, 161, 163, 164, 166, 168, 170, 171, 173, 174, 176], "mostli": [155, 164], "motion": 148, "motor": [127, 146, 148, 155, 170], "motor1_rot": 146, "motor2_rot": 146, "mountain": [130, 155, 158], "mountaincar": [14, 133, 164, 172], "mountaincarcontinu": [14, 16, 19, 134], "mountaincarenv": 133, "move": [2, 14, 17, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 127, 129, 132, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 151, 152, 153, 154, 155, 156, 158, 159, 161, 162, 164, 166, 167, 170, 175, 177], "movement": [154, 159, 164, 166], "moviepi": [9, 17, 155, 156], "moving_avg": 162, "mozer": 131, "mp": 13, "mp4": 162, "mpi": 13, "mpi4pi": 13, "mpi_init": 13, "mt19937": 155, "mtsim": 148, "much": [155, 156, 159, 161, 164, 166, 167, 170], "mujoco": [1, 9, 15, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 155, 156, 158, 168, 170, 171, 176], "mujoco_env": [155, 156], "mujoco_gl": 136, "mujoco_menageri": 170, "mujoco_reinforc": 177, "mujoco_rend": 155, "mujocoenv": 156, "mujocorend": 156, "mujocorender": 156, "multi": [2, 7, 136, 140, 141, 144, 148, 159], "multiag": 148, "multibinari": [5, 6, 7, 8, 13, 18, 156, 158], "multidiscret": [5, 6, 7, 8, 10, 13, 18, 155, 156, 158, 166], "multimod": 148, "multipl": [5, 6, 7, 10, 11, 12, 13, 155, 156, 158, 159, 162, 163, 178], "multipli": [6, 129, 134, 144, 145, 178], "multiprocess": [5, 11, 13, 178], "multivari": [137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147], "must": [2, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 128, 136, 139, 147, 155, 156, 159, 164, 166, 167], "mutual": 136, "my": 175, "my_packag": 159, "mypi": [2, 156], "n": [4, 5, 6, 7, 8, 11, 12, 13, 17, 18, 20, 128, 131, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 155, 156, 158, 162, 164, 174, 175, 177, 178], "n_action": 178, "n_env": 178, "n_episod": [164, 174], "n_featur": 178, "n_run": 175, "n_showcase_episod": 178, "n_steps_per_upd": 178, "n_updat": 178, "na": 145, "name": [1, 3, 4, 11, 12, 15, 20, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 155, 156, 159, 162, 166], "name_prefix": [9, 17, 162], "namedtupl": [156, 175], "namespac": [4, 159, 166], "nanoquadrotor": 148, "narrow": 175, "nativ": 17, "natur": [148, 150, 153, 161, 164, 174], "naverag": 162, "navig": [148, 154, 159, 166, 168], "nbodi": [137, 140, 141], "nchain": 155, "ncol": [151, 152, 153, 164, 174, 175, 178], "ncrement": 177, "ndarrai": [2, 3, 6, 7, 8, 9, 13, 14, 16, 17, 18, 19, 131, 132, 133, 134, 135, 154, 177, 178], "neccari": 9, "necessari": [2, 5, 126, 155, 156], "necessarili": 8, "need": [2, 5, 6, 9, 14, 15, 16, 18, 127, 129, 132, 136, 155, 156, 158, 159, 161, 162, 163, 164, 166, 167, 168, 170, 174, 175, 178], "need_visu": 161, "neg": [2, 7, 9, 134, 137, 138, 139, 140, 141, 142, 144, 145, 146, 147, 154, 158, 159, 164, 177], "neither": [7, 17, 150, 154], "nerdyespresso": 156, "nervous": 127, "nest": [6, 13, 148], "net": [128, 150, 151, 152, 177, 178], "network": [5, 8, 10, 13, 146, 148, 158, 159, 164, 178], "neural": [5, 8, 10, 13, 131, 146, 148, 159, 164, 177, 178], "neurip": 131, "neuro": 148, "neuroflight": 148, "neuronlik": [132, 142, 143], "nevalu": 162, "never": [2, 138, 141, 144, 145, 146, 156], "nevertheless": 168, "new": [2, 5, 14, 15, 16, 17, 18, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 131, 132, 133, 134, 135, 137, 138, 139, 140, 141, 146, 147, 154, 155, 156, 157, 158, 159, 160, 163, 164, 166, 167, 168, 170, 174, 175, 178], "new_action_spac": 14, "new_obs_spac": 14, "new_po": 159, "new_q": 164, "new_spac": 14, "new_stat": 175, "new_throughput": 9, "newer": [136, 155], "newli": [14, 18, 19], "newlin": 2, "next": [2, 3, 10, 13, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 156, 157, 170, 177], "next_ob": [156, 161, 164, 174, 177], "next_stat": [3, 156, 164, 174], "next_step": [11, 12], "next_valu": 161, "nice": 155, "nidhish": 156, "nine": 137, "nintendo": 7, "nip": 131, "nlp": 148, "nlpgym": 148, "nn": [177, 178], "no_grad": 178, "node": [5, 6, 8, 155, 158], "node_spac": [6, 8], "nois": [130, 136, 156], "noisi": [162, 164], "non": [2, 5, 8, 9, 14, 17, 129, 132, 137, 138, 139, 140, 141, 146, 147, 148, 153, 155, 156, 159, 166, 167, 177], "non_random_ob": 128, "nonbreak": 155, "nondeterminist": [4, 166], "none": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 136, 153, 155, 156, 158, 159, 161, 166, 174, 175, 178], "nonlinear": 139, "noop": [7, 9, 17, 154, 156, 178], "noop_max": [17, 156], "nor": [7, 17, 150, 151, 152, 154], "norm": [9, 144, 145, 159, 166], "normal": [2, 4, 7, 10, 13, 14, 17, 18, 19, 20, 127, 128, 135, 137, 138, 142, 155, 156, 163, 164, 177, 178], "normalis": 156, "normalize_tim": 18, "normalizeobserv": [14, 18, 20, 155, 156], "normalizereward": [14, 19, 20, 155], "normalizex": 156, "north": 154, "notabl": [155, 156, 167], "note": [1, 5, 9, 13, 14, 17, 18, 131, 132, 136, 137, 139, 140, 141, 142, 144, 147, 154, 158, 161, 163, 167, 170, 174, 177, 178], "notebook": [1, 155, 166, 167, 168, 170, 171, 174, 175, 177, 178], "noth": [3, 128, 129, 156, 159, 177], "notic": 156, "notif": 156, "notimplementederror": 8, "nov": 154, "now": [2, 127, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 155, 156, 158, 159, 164, 166, 167, 170, 174, 175, 177], "np": [2, 5, 6, 7, 9, 10, 12, 13, 14, 16, 18, 19, 129, 133, 140, 141, 154, 155, 156, 159, 162, 164, 166, 168, 170, 174, 175, 177, 178], "np_random": [2, 5, 9, 10, 11, 12, 15, 155, 156, 159, 166], "np_random_se": [2, 10, 11, 12, 15, 156], "nrow": [153, 175, 178], "nstep": 156, "num": [14, 17, 131, 132, 133, 134, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147], "num_col": 4, "num_edg": 6, "num_env": [4, 10, 11, 12, 13, 14, 132, 156, 159, 178], "num_episod": [161, 164], "num_eval_episod": 162, "num_nod": 6, "num_training_episod": 162, "number": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 16, 17, 18, 20, 128, 129, 131, 136, 139, 140, 141, 146, 147, 148, 150, 153, 155, 156, 158, 159, 160, 162, 163, 164, 166, 170, 175, 177, 178], "numer": [142, 143, 150, 155, 156, 162, 168, 177], "numpi": [2, 5, 7, 9, 10, 11, 12, 13, 14, 16, 17, 18, 19, 20, 155, 156, 159, 162, 164, 166, 168, 170, 174, 175, 177, 178], "numpytotorch": [14, 17, 20, 156], "nv": [140, 141], "nvec": 7, "nvidia": 148, "o": [17, 162, 177, 178], "o_": 167, "o_t": 167, "ob": [9, 12, 14, 16, 17, 18, 128, 154, 155, 156, 158, 159, 161, 162, 164, 168, 170, 174, 177], "obj_slidei": 144, "obj_slidex": 144, "object": [2, 5, 9, 11, 12, 13, 14, 15, 136, 144, 145, 148, 156, 158, 162, 174, 177], "obs0": 18, "obs1": 18, "obs2": 18, "obs3": 18, "obs4": 18, "obs_kei": 18, "obs_shap": 178, "obs_space_dim": 177, "obs_t": 9, "obs_tp": 9, "obs_tp1": 9, "observ": [2, 3, 4, 5, 6, 9, 10, 11, 12, 13, 15, 17, 19, 20, 148, 155, 156, 157, 161, 163, 164, 167, 168, 175, 177], "observation_mod": [11, 12], "observation_spac": [2, 5, 6, 7, 9, 10, 11, 12, 13, 14, 15, 18, 158, 159, 166, 168, 175, 177], "observation_structur": [137, 138, 139, 140, 141, 143, 146, 147], "observationwrapp": [14, 15, 18, 166, 170], "obstacl": 159, "obstructview": 156, "obstyp": [2, 3, 9, 10, 11, 12, 14, 15, 16, 17, 18, 19, 156, 177], "obswrapp": 155, "obtain": [15, 17, 135, 150, 167], "obviou": 167, "obvious": 156, "occur": [2, 10, 131, 132, 166, 178], "octob": 136, "odyse": 170, "off": [17, 128, 129, 151, 152, 154, 155, 156, 158, 159, 175], "offer": 148, "offici": 3, "offlin": [148, 156], "offscreen": [155, 156], "offset": [129, 140, 141], "offworld": 148, "often": [2, 5, 148, 156, 164, 166, 175], "oftentim": 166, "old": [10, 16, 136, 155, 156, 157, 160], "old_epsilon": 164, "old_po": 159, "old_spac": 14, "old_throughput": 9, "oldenv": 161, "older": [136, 156, 160, 161], "oldv21env": 160, "oleg": [126, 127, 128, 129], "olimoyo": 155, "olipinski": [155, 156], "omar": 156, "omega_1": 142, "omega_2": 142, "omesa": 136, "omg": 148, "omit": [137, 138, 139, 140, 141, 146, 147], "omniisaacgymenv": 148, "omnivers": 148, "onc": [1, 17, 154, 155, 159, 161, 164, 166, 174, 178], "one": [2, 5, 6, 7, 8, 9, 11, 15, 16, 131, 132, 133, 134, 135, 136, 137, 139, 142, 143, 146, 150, 154, 155, 156, 159, 160, 162, 164, 167, 168, 170, 174, 175, 177, 178], "oneof": [5, 6, 8, 13, 156], "ones": [14, 130, 155, 164, 174, 178], "ongo": 178, "onli": [2, 4, 5, 6, 7, 8, 9, 10, 17, 18, 131, 132, 133, 134, 137, 138, 139, 140, 141, 142, 143, 145, 146, 147, 154, 155, 156, 159, 161, 162, 166, 168, 170, 174, 175, 178], "onlin": [140, 141, 150, 151, 152, 161], "onward": 167, "op": [17, 156], "open": [1, 17, 136, 148, 155, 156, 158, 166], "openai": [2, 19, 126, 155, 156, 157, 161, 167, 174, 177], "opencv": [14, 17, 18, 20, 155], "opengl": [136, 156], "openmodelica": 148, "oper": [8, 14, 136, 148, 155], "oppon": 159, "opportun": 148, "opt": 170, "optim": [13, 14, 17, 127, 129, 140, 141, 148, 156, 158, 159, 161, 164, 174, 175, 177, 178], "optimis": [10, 148, 155, 172], "optimist": 164, "option": [2, 3, 4, 5, 6, 7, 10, 11, 12, 14, 15, 18, 128, 131, 132, 133, 134, 135, 136, 148, 155, 156, 158, 159, 161, 166], "ord": [9, 159, 166], "order": [4, 5, 6, 15, 17, 129, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 155, 156, 158, 163, 166, 175], "order_enforc": [4, 166], "ordereddict": 156, "orderenforc": [4, 15, 17, 20, 127, 128, 129, 131, 132, 133, 134, 135, 155, 156, 158, 159, 166], "orderli": 155, "org": [10, 11, 12, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 156, 174, 177, 178], "orient": [129, 137, 140, 141], "origin": [8, 10, 14, 16, 17, 18, 128, 131, 132, 136, 142, 155, 156, 158, 159, 161, 164, 170], "orsini": 155, "osmesa": 136, "other": [14, 16, 20, 129, 135, 136, 138, 140, 142, 146, 147, 153, 154, 155, 156, 158, 160, 161, 162, 164, 166, 168, 170, 172, 174, 175, 177, 178], "otherwis": [2, 4, 6, 7, 9, 11, 12, 14, 17, 18, 139, 155, 156, 159, 174, 175], "our": [156, 158, 159, 161, 164, 166, 170, 174, 175, 178], "out": [2, 3, 13, 14, 15, 148, 155, 156, 166, 167, 168, 172, 177], "outcom": [150, 175], "outer": 131, "outermost": 14, "outlin": [150, 155, 158, 159, 164, 174], "output": [1, 9, 10, 13, 14, 17, 155, 156, 158, 159, 166, 174, 177, 178], "output_truncation_bool": 9, "outsid": [2, 14, 18, 128, 129, 155, 156, 159, 167], "outweigh": 156, "over": [5, 9, 13, 17, 138, 140, 150, 153, 155, 156, 158, 162, 164, 168, 170, 174, 178], "overal": 156, "overcom": 175, "overfit": [170, 178], "overflow": 156, "overhaul": 156, "overhead": 129, "overrid": [4, 11, 14, 156, 168], "overview": 177, "overwrit": [16, 18, 19], "overwritten": [15, 155, 156], "own": [11, 15, 148, 156, 158, 161, 162, 164, 168, 169, 170, 171], "p": [138, 148, 151, 152, 153, 154, 155, 175, 178], "p_": [144, 145], "p_0": 148, "pace": 148, "packag": [1, 10, 17, 126, 136, 148, 155, 156, 159, 175], "package_data": 155, "pad": [18, 129, 156], "padding_typ": [18, 156], "page": [16, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 151, 152, 156, 158, 159, 161, 163, 164, 172], "painlessli": 5, "pair": [136, 140, 141, 164], "palett": 177, "pan": 144, "panda": [148, 175, 177], "paper": [131, 142, 148, 156, 162, 163], "paradigm": 2, "parallel": [10, 11, 12, 14, 148, 156, 159, 162, 163, 178], "param": [3, 7, 9, 156, 175], "paramet": [2, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 129, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 155, 156, 158, 159, 161, 164, 166, 168, 177, 178], "parameter": [2, 177, 178], "parameter_tun": 155, "parametr": [5, 177], "parent": 13, "pars": 4, "parse_env_id": 4, "parser": 156, "part": [17, 127, 128, 129, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 150, 151, 152, 153, 154, 155, 156, 159, 167, 170, 175], "parti": [136, 137, 138, 139, 140, 141, 143, 146, 147, 155, 156, 166], "partial": [2, 148, 155, 156, 159], "particular": [5, 6, 9, 10, 20, 129, 156, 158, 160, 163, 167, 170, 175], "particularli": [9, 17, 18, 132, 156, 159], "pass": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 14, 15, 16, 17, 18, 19, 20, 128, 137, 138, 139, 140, 141, 146, 147, 155, 156, 158, 159, 160, 161, 166, 168, 178], "passeng": 154, "passenger_loc": 154, "passidx": 154, "passiv": [17, 20, 155, 156], "passiveenvcheck": [4, 15, 17, 20, 127, 128, 129, 131, 132, 133, 134, 135, 156, 158, 159], "past": [14, 18, 19, 155], "patch": [155, 174], "path": [4, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 153, 156, 159, 162, 166, 178], "patienc": [155, 164], "pattern": [161, 162], "paulmest": 156, "paw": 138, "pcg64": 155, "pd": [175, 177], "pdf": [131, 150, 151, 152], "peg": 155, "pelvi": [140, 141], "penal": [137, 138, 139, 140, 141, 142, 144, 145, 146, 147, 168], "penalis": [133, 134], "penalti": [154, 159], "pend": [11, 155], "pendulum": [11, 12, 18, 130, 131, 132, 136, 155, 158, 177], "pendulumenv": 135, "per": [7, 9, 10, 17, 129, 132, 154, 155, 161, 163, 164, 167, 170, 178], "percentag": [128, 174], "peretz": 156, "perez": 156, "perf_count": 155, "perfect": [158, 159, 164], "perfectli": 166, "perform": [2, 5, 14, 17, 145, 155, 156, 158, 160, 162, 163, 164, 170, 177], "period": 139, "perman": [144, 145], "permiss": [155, 156], "perpendicular": [151, 152, 153, 175], "perpendicularli": 142, "person": 131, "perspect": 148, "perturb": [137, 138, 139, 140, 141, 142, 143, 146, 147], "pet": 158, "pettingzoo": [2, 148, 155], "pge": 148, "phase": [148, 159, 178], "phd": [133, 134, 146], "philosoph": 9, "photorealist": 148, "phys2d": 17, "physic": [2, 126, 136, 142, 143, 144, 145, 148, 155, 156, 159, 177], "pi": [129, 131, 133, 135], "pick": [154, 164, 170, 174, 175, 178], "pickl": [1, 13, 155, 156], "pickled_env_spec": 156, "pickup": 154, "pictur": [158, 162], "piec": 166, "pierrecounath": 156, "pierremardon": 156, "pierr\u00e9": [156, 175], "pinocchio": 148, "pip": [1, 126, 130, 136, 155, 156, 158, 166, 170], "pip3": 155, "pipe": [11, 155], "pipx": 166, "pirata": 155, "pitfal": 127, "pix_square_s": 166, "pixel": [2, 18, 128, 148, 158, 161, 166], "pixelobservationwrapp": [18, 155, 156], "pixelobswrapp": 155, "pixels3d": 166, "pkuderov": 156, "place": [9, 17, 132, 133, 134, 156, 159, 166, 178], "plai": [9, 128, 148, 155, 156, 158, 159, 164, 174], "plan": [148, 155, 156, 159], "plateau": 164, "platform": 148, "playablegam": 9, "player": [148, 150, 151, 152, 153, 154, 164, 174, 175], "player_count": 174, "player_sum": 164, "playfield": 128, "playplot": [9, 156], "pleas": [2, 5, 7, 18, 136, 148, 155, 156, 159, 164, 172], "plot": [1, 9, 162, 164, 174, 175], "plot_nam": 9, "plot_q_values_map": 175, "plot_states_actions_distribut": 175, "plot_steps_and_reward": 175, "plot_surfac": 174, "plotter": 9, "plt": [162, 164, 174, 175, 177, 178], "plu": [7, 151, 152, 156, 162, 164], "plugin": [155, 156], "pm": 129, "png": 170, "point": [4, 8, 9, 15, 127, 128, 129, 131, 132, 135, 136, 145, 150, 155, 156, 159, 167], "pointless": 156, "pole": [2, 130, 136, 142, 143, 148, 158, 177], "pole2": 142, "pole_angl": 158, "pole_angular_veloc": 158, "poli": 148, "polici": [2, 14, 18, 19, 130, 136, 137, 138, 139, 140, 141, 146, 147, 148, 155, 156, 157, 158, 162, 164, 167, 170, 175, 178], "policy_grid": 174, "policy_mean_net": 177, "policy_network": 177, "policy_stddev_net": 177, "polygon": 155, "pomdp": 3, "pong": [17, 156, 161], "pontryagin": 129, "pool": [17, 146], "poorli": 159, "pop": [2, 155, 156], "pop_fram": 17, "popular": [14, 17, 126, 148, 156, 164, 174], "pose": 148, "posit": [2, 6, 7, 8, 9, 11, 13, 17, 127, 128, 129, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 151, 152, 153, 154, 156, 158, 159, 166, 168, 174], "position_fingertip": 145, "position_target": 145, "possibl": [2, 5, 6, 7, 8, 14, 16, 17, 129, 131, 132, 133, 134, 136, 138, 140, 143, 146, 151, 152, 153, 154, 155, 156, 158, 159, 161, 162, 164, 166, 170, 174, 175], "possibli": [7, 13, 15, 17, 159, 178], "post": [155, 156, 161, 175], "postprocess": 175, "potenti": [156, 161], "pow": 178, "power": [17, 128, 129, 134, 142, 143, 148, 177], "pp": 154, "ppo": 172, "pprint": [14, 156], "pprint_registri": [2, 4, 156, 158, 159], "pr": [140, 148, 155, 156], "practic": [148, 155, 158, 161, 164, 167, 174], "practition": 162, "pre": [4, 5, 153, 156, 166], "precis": [6, 155], "predefin": 166, "predict": [139, 148, 164, 177, 178], "predominantli": 3, "prefix": 162, "preload": 153, "premad": 148, "prematur": 2, "prepend": [9, 17], "preprocess": [9, 17, 20, 155, 156], "present": [131, 148, 155, 162, 167, 174], "preserv": [161, 167], "press": [7, 9, 128, 131, 158], "pressur": 159, "pretti": [4, 156, 175], "prevent": [3, 7, 11, 155, 156, 158, 159, 161], "previou": [17, 156, 167, 168], "previous": [4, 9, 18, 137, 138, 139, 140, 141, 143, 146, 147, 155, 156, 160], "primarili": [148, 156], "primaryclass": 156, "principl": 129, "print": [4, 156, 158, 159, 162, 164, 166, 168, 170, 175, 177, 178], "print_registri": 4, "prior": 4, "priori": 148, "privat": 166, "prng": [2, 5, 6, 7], "proabil": [151, 152], "prob": [177, 178], "proba_frozen": 175, "probabl": [5, 6, 7, 16, 20, 151, 152, 153, 154, 156, 161, 164, 167, 174, 175, 177, 178], "problem": [17, 129, 132, 135, 137, 140, 141, 142, 143, 146, 148, 150, 154, 156, 157, 158, 161, 163, 164, 167, 170, 178], "procedur": 177, "proceed": 131, "process": [9, 10, 11, 13, 14, 18, 131, 148, 156, 158, 166, 167, 178], "process_ev": 9, "produc": [2, 17, 20, 155, 156, 166], "product": [6, 7, 177], "program": [10, 11, 12, 148, 156], "progress": [6, 9, 156, 159, 162, 164, 178], "project": [9, 148, 155, 156, 159, 161, 162, 166, 174], "prompt": 156, "propag": 175, "proper": [155, 158, 161], "properli": [1, 5, 155, 158, 159, 161, 170], "properti": [2, 5, 10, 11, 12, 14, 15, 18, 19, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 155, 156, 167], "proport": 178, "propos": [16, 156], "protocol": 17, "prototyp": 148, "prove": 148, "prover": 148, "provid": [2, 5, 6, 7, 9, 10, 11, 14, 16, 17, 18, 20, 126, 127, 131, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 155, 156, 158, 159, 160, 161, 162, 163, 164, 166, 172, 174], "psc": 155, "pseudo": [155, 156, 178], "pseudorandom": [5, 7], "publicli": 156, "publish": 156, "pull": [18, 19, 155], "pump": 166, "pure": 164, "purpos": [3, 5, 155, 161, 162], "push": [129, 132, 136, 142, 143, 148, 156, 158, 177], "pusher": [136, 156], "pusher_v5": 144, "put": [155, 166, 175], "puzzl": 148, "py": [1, 9, 126, 127, 128, 129, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 151, 152, 155, 156, 166, 167, 168, 170, 174, 175, 177, 178], "pybullet": 148, "pycharm": 156, "pydoc": 155, "pyflyt": [148, 156], "pygam": [2, 9, 126, 155, 156, 166], "pyglet": 155, "pypi": [155, 156], "pyplot": [162, 164, 174, 175, 177, 178], "pyproject": 166, "pyright": [2, 155, 156], "pystk2": 148, "python": [1, 17, 126, 127, 128, 129, 148, 155, 156, 157, 158, 159, 161, 166, 167, 168, 170, 171, 172, 174, 175, 177, 178], "pytorch": [14, 17, 20, 156, 163, 172, 177], "q": [154, 162, 167, 171, 172, 176, 178], "q_": 167, "q_tabl": 161, "q_target": 167, "q_updat": 175, "q_valu": [154, 164, 174], "qfrc_actuat": [140, 141], "qfrc_constraint": 142, "qgallouedec": 156, "qlearn": 175, "qpo": [136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147], "qtabl": 175, "qtable_best_act": 175, "qtable_direct": 175, "qtable_directions_map": 175, "qtable_val_max": 175, "quad": 141, "quad_ctrl_cost": 141, "quad_impact_cost": 141, "quadcopt": 148, "quadrotor": 148, "quadrup": [136, 137, 156, 169, 171], "quagla": 155, "qualiti": [10, 148, 156], "quaternion": [137, 140, 141], "queen": 150, "question": [148, 161, 166], "queue": [11, 162], "quicker": 178, "quickli": [133, 148, 164, 174, 175], "quit": [11, 156, 166], "qvel": [136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147], "qwop": 148, "r": [1, 7, 14, 17, 19, 131, 135, 148, 150, 151, 152, 154, 162, 168, 170, 175, 177], "r_": 178, "r_elbow_flex_joint": 144, "r_forearm_roll_joint": 144, "r_shoulder_lift_joint": 144, "r_shoulder_pan_joint": 144, "r_t": 167, "r_upper_arm_roll_joint": 144, "r_wrist_flex_joint": 144, "r_wrist_roll_joint": 144, "race": [126, 148, 155], "racecar": 148, "racecar_gym": 148, "racing_dream": 148, "rad": [131, 132, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147], "radian": [129, 131, 132, 135, 143], "rafaelcp": 156, "raghuspacerajan": 155, "rainbow": [172, 177], "raini": 156, "rais": [2, 4, 7, 8, 9, 11, 12, 13, 15, 17, 18, 132, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 155, 156, 178], "ram": 163, "rand": 155, "randint": 155, "randn": 155, "random": [2, 3, 4, 5, 6, 7, 9, 10, 11, 12, 17, 18, 128, 129, 131, 132, 133, 134, 135, 137, 138, 139, 140, 141, 142, 143, 145, 146, 147, 153, 154, 155, 156, 158, 159, 162, 164, 166, 174, 175, 177], "randomize_domain": 178, "randomize_ob": 128, "randomli": [5, 6, 9, 129, 153, 155, 156, 158, 159, 164, 166, 175, 178], "randomnumbergener": 155, "randomst": 155, "rang": [7, 9, 13, 14, 16, 17, 18, 20, 127, 130, 131, 132, 133, 134, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 150, 151, 152, 153, 154, 155, 156, 157, 158, 159, 161, 162, 164, 166, 168, 170, 171, 173, 174, 175, 176, 177, 178], "rangefind": 127, "raphajan": 156, "rapidli": 148, "rare": [7, 155], "rate": [144, 145, 148, 162, 164, 174, 175, 177, 178], "rather": [2, 4, 6, 128, 155, 156, 162, 174, 178], "raw": [156, 159, 162, 170], "rayerdyn": 156, "rcparam": 177, "rdnfn": 155, "re": [1, 155, 156, 158, 161, 162, 164, 166, 175, 177], "reach": [2, 4, 17, 18, 20, 130, 131, 132, 133, 134, 136, 148, 151, 152, 153, 154, 156, 159, 161, 166, 167, 172, 174, 175, 177], "reachabl": 154, "reacher": [136, 156, 168], "reacher_weighted_reward": 166, "reacherrewardwrapp": 168, "read": [2, 5, 10, 13, 19, 131, 137, 140, 141, 155, 156, 159, 164], "read_from_shared_memori": [5, 13], "readabl": [5, 6, 156, 159], "reader": [163, 170], "readi": [158, 170, 174], "readm": [155, 156, 166], "readthedoc": 18, "real": [9, 138, 148, 158], "realist": [136, 148], "realli": [156, 159, 170, 174], "rear": 128, "reason": [2, 17, 129, 148, 155, 156, 159, 161, 170], "rebuild": 1, "receiv": [9, 18, 19, 20, 128, 129, 134, 147, 154, 155, 157, 158, 164, 167, 174, 177, 178], "recent": [13, 14, 17, 18, 19, 156, 160, 162], "recent_reward": 162, "recogn": 156, "recommend": [3, 4, 9, 11, 17, 129, 136, 137, 140, 141, 155, 156, 159, 170, 174, 178], "reconstruct": 158, "record": [4, 9, 17, 20, 127, 148, 155, 156, 158, 161, 164, 177, 178], "recordconstructorutil": 156, "recorded_fram": 156, "recordepisodestat": 155, "recordepisodestatist": [14, 17, 20, 155, 156, 162, 164, 174, 177, 178], "recordvideo": [17, 20, 155, 156, 162], "recordvideov0": 156, "recreat": 156, "recreated_env": 156, "rect": 166, "red": [154, 155, 166], "redirect": [21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125], "redtachyon": [155, 156], "reduc": [132, 148, 163, 164, 172, 174, 178], "redund": 155, "refactor": [155, 156], "refer": [2, 4, 5, 7, 9, 136, 156, 157, 163, 166, 167, 170], "referenc": 156, "reflect": [18, 132, 155, 156], "refresh": 175, "regard": 130, "regardless": [137, 138, 139, 140, 141, 146, 147, 170], "regex": 4, "reginald": 156, "regist": [13, 155, 156, 160], "register_env": [17, 156, 161], "registr": [4, 155, 156, 166], "registri": [4, 155, 156], "regress": [9, 156], "regularli": 156, "reinforc": [2, 5, 131, 146, 148, 149, 150, 151, 152, 154, 155, 156, 157, 163, 167, 171, 172, 174, 175, 176, 178], "reiniti": [155, 177], "rel": [131, 140, 141, 156, 166, 168, 178], "relat": [129, 132, 137, 139, 140, 141, 142, 143, 144, 145, 147, 148, 156, 177], "relative_posit": 166, "relativeposit": [166, 168], "releas": [10, 11, 12, 131, 132, 133, 134, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 150, 151, 152, 153, 154, 166], "relev": [155, 160, 166], "reli": 136, "reliabl": 164, "relu": [14, 178], "remain": [18, 151, 152, 155, 161, 166, 167], "remak": 178, "rememb": [17, 128, 164, 166, 168], "remind": [156, 170], "remot": [148, 156], "remov": [2, 4, 17, 18, 137, 138, 139, 140, 141, 145, 146, 147, 154, 155, 156], "renam": [14, 17, 18, 138, 140, 155, 156, 177], "render": [2, 3, 4, 10, 14, 15, 17, 18, 20, 126, 127, 137, 138, 139, 140, 146, 147, 148, 155, 156, 158, 162, 168, 174, 175], "render_clos": 3, "render_fp": [2, 9, 17, 156, 166], "render_imag": 3, "render_init": 3, "render_kei": 18, "render_mod": [2, 3, 9, 10, 15, 17, 18, 127, 128, 131, 132, 133, 134, 135, 136, 155, 156, 157, 158, 159, 160, 161, 162, 166, 170, 175, 178], "render_onli": 18, "render_st": 3, "rendercollect": [2, 17, 20, 156], "renderedfram": [17, 20], "renderfram": [2, 9, 10, 14, 15], "renderstatetyp": 3, "renorm": 129, "rep": 175, "repeat": [4, 16, 18, 20, 156, 158, 159, 164, 175], "repeat_action_dur": 16, "repeat_action_prob": 16, "repeatedli": 158, "rephras": 155, "replac": [17, 18, 137, 146, 150, 155, 156, 158, 162, 164, 166, 170, 174], "replay_buff": 156, "repo": [1, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 155, 156], "report": [127, 137, 140, 141, 155, 156, 161], "repositori": [136, 155, 172], "repres": [2, 6, 7, 9, 18, 129, 131, 134, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 151, 152, 153, 154, 155, 156, 157, 158, 159, 166, 170, 175, 177], "represent": [2, 156, 167], "reproduc": [2, 6, 148, 156, 159, 161, 175], "request": [18, 150, 156], "requir": [1, 2, 5, 6, 9, 11, 14, 18, 136, 147, 155, 156, 159, 163, 164, 166, 170, 174, 177, 178], "rerun": 156, "res_al": 175, "rescal": [14, 16, 18, 20, 158], "rescale_act": 155, "rescaleact": [14, 15, 16, 20, 156, 158], "rescaleobserv": [14, 18, 20, 156], "research": [136, 142, 148, 154, 156, 161, 163], "reseed_sampl": 156, "reseed_valu": 156, "reset": [2, 3, 4, 9, 10, 11, 12, 14, 15, 16, 17, 18, 19, 20, 129, 131, 132, 133, 134, 135, 137, 138, 139, 140, 141, 142, 143, 146, 147, 151, 152, 153, 154, 155, 156, 157, 158, 162, 164, 170, 174, 175, 177, 178], "reset_async": 156, "reset_clean": 17, "reset_noise_scal": [137, 138, 139, 140, 141, 142, 143, 146, 147, 170], "reset_qt": 175, "reset_wait": 156, "resetneed": 17, "reshap": [14, 18, 20, 175], "reshape_env": 18, "reshapeobserv": [14, 18, 20], "resiz": [14, 17, 18, 20, 156], "resized_env": 18, "resizeobserv": [14, 18, 20, 156], "resolv": 155, "resourc": [10, 11, 12, 159, 161, 166, 174], "respect": [14, 15, 17, 129, 131, 137, 138, 139, 140, 141, 146, 147, 155, 156, 158, 168, 178], "respectivesli": 14, "respond": [158, 174], "rest": [128, 129, 139, 147, 156, 159, 178], "restart": 158, "restor": [137, 138, 139, 140, 141, 146, 147, 164], "restrict": 156, "result": [2, 6, 8, 11, 12, 13, 17, 129, 131, 132, 136, 137, 140, 141, 142, 145, 149, 151, 152, 154, 155, 156, 158, 159, 161, 162, 174, 175, 178], "retriev": 4, "retro": [148, 156], "return": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 127, 136, 137, 138, 139, 140, 141, 145, 146, 147, 150, 151, 152, 153, 154, 155, 156, 158, 159, 161, 164, 166, 167, 168, 174, 175, 177, 178], "return_info": [2, 155], "return_queu": [14, 17, 162, 164, 174, 177, 178], "reveal": [150, 162], "revers": [5, 8, 150, 177, 178], "revert": [155, 156], "revisit": 17, "rew": [9, 14, 17, 19, 167], "reward": [2, 3, 4, 9, 10, 11, 12, 15, 17, 18, 20, 148, 155, 156, 157, 158, 161, 162, 164, 166, 167, 168, 174, 175, 177, 178], "reward_al": 140, "reward_control": [144, 145], "reward_control_weight": [144, 145], "reward_ctrl": [14, 137, 139, 140, 144, 145, 147, 168], "reward_ctrl_weight": 168, "reward_dist": [144, 145, 168], "reward_dist_weight": [144, 145, 168], "reward_forward": [137, 138, 139, 140, 146, 147], "reward_fwd": 146, "reward_linvel": 140, "reward_moving_averag": [164, 174], "reward_near": 144, "reward_near_weight": [144, 145], "reward_over_episod": 177, "reward_quadctrl": 140, "reward_rang": 156, "reward_run": [14, 138], "reward_scal": 159, "reward_surv": [137, 139, 140, 142, 143, 147], "reward_threshold": [4, 137, 138, 139, 140, 141, 144, 145, 146, 147, 156, 166], "rewards_df": 175, "rewards_over_se": 177, "rewardtyp": [3, 156], "rewardwrapp": [14, 15, 19, 170], "rewrit": [155, 156], "rgb": [2, 14, 17, 18, 20, 128, 137, 138, 139, 140, 146, 147, 155, 156, 158], "rgb_arrai": [2, 3, 9, 17, 18, 20, 127, 128, 131, 132, 133, 134, 135, 136, 155, 156, 158, 161, 162, 166, 170, 175, 178], "rgb_array_list": [2, 9, 17, 155], "rgbd": 156, "rgbd_tupl": 136, "richard": 175, "ride": [158, 164], "right": [2, 7, 127, 128, 129, 132, 133, 134, 135, 137, 138, 139, 140, 141, 142, 143, 146, 147, 151, 152, 153, 154, 156, 158, 159, 164, 166, 174, 175, 177], "right_back_leg": 137, "right_elbow": [140, 141], "right_foot": [140, 141], "right_hip_i": [140, 141], "right_hip_x": [140, 141], "right_hip_z": [140, 141], "right_kne": [140, 141], "right_lower_arm": [140, 141], "right_shoulder1": [140, 141], "right_shoulder2": [140, 141], "right_sin": [140, 141], "right_thigh": [140, 141], "right_upper_arm": [140, 141], "rigid": [140, 141], "risk": 148, "riski": 148, "rl": [9, 17, 148, 156, 157, 159, 162, 164, 167, 170, 171, 173, 174, 176, 177], "rlbook2020": [150, 151, 152], "rmsprop": 178, "rnd": [155, 156], "rng": [2, 3, 5, 6, 7, 9, 10, 155, 156, 166, 175], "road": [128, 156], "roadmap": 156, "robertoschiavon": 156, "robo": 148, "robot": [127, 133, 134, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 155, 156, 158, 161, 167, 169, 171], "robust": [148, 178], "rocket": [129, 148], "rodrigo": 156, "rodrigodelazcano": [155, 156], "rogerjl": 156, "rohan138": 155, "roll": [18, 20, 144, 174], "rolling_length": [164, 174, 178], "rollout": [154, 156], "rom": [155, 156], "ronald": 177, "root": [6, 137, 140, 141, 156], "rooti": [138, 139, 147], "rootx": [138, 139, 147], "rootz": [138, 139, 147], "rotat": [129, 131, 137, 140, 141, 144, 155, 174], "rotor": [137, 138, 139, 140, 141, 146, 147], "roughli": 136, "roulett": 155, "roundtrip": 17, "row": [151, 152, 153, 159, 164, 175], "rpg": 153, "rr": 156, "rstride": 174, "rule": [148, 150, 159, 164, 174], "run": [1, 2, 4, 10, 11, 12, 14, 17, 18, 19, 127, 129, 131, 136, 137, 138, 139, 140, 146, 147, 148, 151, 152, 155, 156, 158, 161, 162, 163, 166, 170, 178], "run_": 1, "run_env": 175, "run_gymnasium_env": 166, "runner": 136, "running_g": 177, "runningmeanstd": [14, 18, 19], "runtim": 178, "runtimeerror": [11, 12, 178], "rushivarora": 155, "rusu24edward": [155, 156], "ryanrud": 155, "r\u00e9mi": 146, "s_": 178, "sab": [150, 164, 174], "safe": [129, 148, 156, 158], "safeti": [148, 155, 156, 159], "sai": [17, 155, 164, 168], "said": [3, 140], "same": [4, 5, 6, 8, 9, 10, 11, 12, 13, 14, 16, 18, 20, 127, 128, 131, 136, 137, 138, 139, 140, 141, 142, 144, 145, 146, 147, 154, 155, 156, 159, 161, 163, 164, 167, 170, 174, 178], "sampl": [2, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 17, 18, 19, 129, 144, 154, 155, 156, 157, 158, 161, 162, 163, 164, 166, 170, 174, 175, 177, 178], "sample_act": 177, "sample_mask": 6, "sample_n": 5, "sample_phas": 178, "samplefactori": 156, "sander": 156, "saniti": 175, "sarsa": 164, "sashashura": [155, 156], "satisfi": 2, "satur": 148, "save": [14, 17, 155, 156, 158, 162, 164, 168, 175], "save_logg": 9, "save_video": [9, 155], "save_videos1": 17, "save_videos2": 17, "save_videos3": 17, "save_weight": 178, "sb3": 155, "scalabl": 148, "scalar": [7, 14, 16, 155], "scale": [14, 17, 18, 19, 129, 137, 138, 139, 140, 141, 142, 143, 146, 147, 148, 156, 163, 178], "scale_and_shift": 14, "scale_ob": 17, "scenario": [128, 148, 162], "scene": [2, 148, 156, 170], "sched": 148, "schedul": [9, 148, 153], "scheme": 128, "schulhoff": 156, "schulman": [137, 178], "scienc": 164, "scope": [2, 167], "score": [127, 129, 158, 159], "scoreboard": 155, "scratch": [177, 178], "screen": [17, 137, 138, 139, 140, 146, 147, 155, 156, 158], "screen_siz": 17, "script": [1, 148, 162, 174], "sdl": 156, "seaborn": [174, 175, 177], "search": 156, "sebastian": 156, "second": [1, 6, 9, 10, 17, 129, 132, 142, 145, 146, 148, 156, 162, 163, 170], "section": [16, 128, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 156, 166, 174, 175], "see": [1, 2, 5, 6, 9, 10, 11, 12, 17, 128, 129, 131, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 151, 152, 153, 155, 156, 158, 159, 161, 162, 164, 166, 170, 175, 178], "seed": [2, 3, 4, 5, 6, 7, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 131, 132, 133, 134, 135, 136, 155, 156, 157, 158, 159, 162, 166, 175, 177, 178], "seeded_valu": 156, "seem": [158, 175], "seen": [131, 159], "segment": 146, "select": [5, 7, 9, 136, 156, 158, 170, 178], "select_act": 178, "self": [5, 6, 7, 9, 14, 18, 19, 134, 148, 156, 159, 164, 166, 168, 174, 175, 177, 178], "semant": 155, "send": 14, "sens": [7, 159, 170, 175], "sensor": [128, 170], "sent": 155, "separ": [5, 17, 156, 159, 161, 166, 178], "sepsi": 148, "sequenc": [2, 4, 5, 6, 7, 8, 11, 12, 13, 14, 18, 148, 155, 156, 158, 159], "sequenti": [162, 177, 178], "seri": [6, 158], "serial": [12, 178], "serv": [3, 5, 137, 138, 139, 140, 141, 146, 147, 162], "server": 156, "set": [2, 4, 5, 6, 7, 9, 10, 11, 12, 15, 16, 17, 18, 20, 126, 129, 130, 131, 133, 134, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 153, 155, 156, 159, 161, 162, 166, 167, 168, 170, 172, 174, 175, 177, 178], "set_attr": [11, 12, 156], "set_color": 175, "set_linewidth": 175, "set_mod": 166, "set_np_random_through_se": [2, 10], "set_rotate_label": 174, "set_stat": 155, "set_them": 175, "set_titl": [164, 174, 175, 178], "set_vis": 175, "set_wrapper_attr": [15, 156], "set_xlabel": [164, 174, 178], "set_xtick": 175, "set_xticklabel": 174, "set_ylabel": [164, 174], "set_yticklabel": 174, "set_zlabel": 174, "setup": [155, 162], "seungjaeryanle": 155, "seven": 147, "sever": [2, 4, 7, 10, 17, 129, 155, 156, 158, 159, 162, 175], "sfff": 153, "sfffffff": 153, "shape": [2, 5, 6, 7, 8, 10, 11, 13, 14, 16, 17, 18, 20, 131, 132, 133, 134, 135, 137, 140, 141, 150, 151, 152, 153, 154, 155, 156, 158, 159, 166, 168, 175, 177, 178], "share": [5, 11, 156, 162, 177], "shared_featur": 177, "shared_memori": [11, 13], "shared_net": 177, "sheet": 164, "shen": 156, "shift": 7, "shimmi": 156, "shin": [138, 140, 141], "shinrl": 148, "shoot": 11, "short": [136, 155, 161, 164], "shorthand": 155, "should": [1, 2, 5, 7, 9, 10, 11, 12, 13, 14, 17, 136, 145, 155, 156, 158, 159, 163, 164, 166, 167, 168, 170, 174, 178], "shoulder": 144, "shouldn": [156, 159, 166], "show": [3, 136, 150, 155, 156, 158, 161, 162, 164, 166, 168, 170, 171, 173, 174, 175, 176, 177, 178], "showcas": [165, 169, 171, 174], "shown": [128, 131, 167], "shrink_act": 14, "siddarth": [156, 177], "side": [13, 129, 175], "sign": [142, 143, 177], "signal": [2, 17, 137, 139, 140, 147, 154, 158, 166, 167, 175], "signatur": 160, "signific": [148, 156, 160, 161, 162, 170], "significantli": [155, 156, 178], "silenc": 9, "silent": 156, "silver": [175, 178], "sim": [148, 175], "similar": [6, 10, 144, 155, 156, 159, 166], "similarli": [129, 156], "simlat": 136, "simonini": 175, "simoninithoma": 175, "simpl": [127, 148, 149, 157, 158, 161, 162, 164, 167, 177], "simplegrid": 148, "simpler": 158, "simplest": 178, "simpli": [14, 16, 17, 18, 19, 166], "simplic": 148, "simplifi": [135, 155, 156], "simplist": 166, "simul": [2, 136, 140, 141, 142, 143, 148, 156, 159, 174, 175, 177], "simultan": [156, 159], "sin": [129, 135, 142, 145], "sinc": [5, 14, 17, 126, 132, 141, 145, 154, 155, 156, 159, 160, 166, 167, 170, 175], "sine": [131, 142, 145], "singl": [2, 3, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 18, 20, 139, 147, 148, 155, 156, 158, 159, 161, 163, 166, 174, 177], "single_action_spac": [10, 13, 14, 156, 178], "single_func": 14, "single_observation_spac": [10, 11, 14, 156, 178], "single_rgb_arrai": 155, "sinusoid": [133, 134], "site": 155, "situat": [154, 158, 164], "six": 147, "size": [5, 13, 14, 17, 148, 153, 155, 156, 159, 166, 170], "sjmikler": 156, "skeleton": 166, "skill": [159, 162], "skip": [9, 17, 18, 20, 155, 156, 161, 166], "skip_and_max_ob": 18, "skip_close_check": 9, "skip_render_check": 9, "sleep": 129, "slide": [138, 139, 142, 143, 144, 145, 146, 147], "slider": [142, 143], "slider1": 146, "slider2": 146, "slight": 127, "slightli": [9, 127, 136, 137, 140, 141, 142, 145, 164], "slime": 148, "slimevolleygym": 148, "slipperi": [151, 153], "slow": [156, 174], "slowdown": 9, "slower": [129, 164, 178], "small": [127, 148, 149, 155, 156, 159, 164, 177], "smallest": 7, "smart": 148, "smarter": 158, "smooth": [162, 164], "smoother": [155, 174], "sn": [174, 175, 177], "snake_cas": 1, "snippet": [9, 17], "snow": 153, "so": [1, 9, 11, 14, 17, 18, 20, 129, 130, 137, 138, 139, 140, 141, 144, 145, 146, 147, 151, 152, 153, 155, 156, 159, 162, 164, 166, 167, 168, 170, 174, 175, 178], "soft": 148, "softmax": 178, "softrobot": 148, "softwar": [2, 148, 156], "sokoban": 148, "sole": [155, 156, 160], "solut": [129, 156, 174], "solv": [2, 127, 130, 132, 136, 142, 143, 148, 159, 161, 164, 166, 171, 176, 177], "some": [2, 5, 6, 7, 10, 11, 12, 14, 15, 128, 130, 131, 145, 146, 154, 155, 156, 158, 161, 162, 164, 166, 168, 170, 174, 175, 178], "someth": [155, 156, 170], "sometim": [9, 137, 151, 152, 153, 158, 159, 162, 166, 168], "sonelu": 156, "soon": [155, 166], "sophist": [159, 162], "sort": 7, "sourc": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 136, 148, 154, 155, 156, 166, 167, 168, 170, 171, 174, 175, 177, 178], "south": 154, "space": [2, 9, 10, 11, 12, 14, 15, 16, 17, 18, 20, 136, 148, 149, 155, 156, 164, 166, 168, 175, 177, 178], "spacecraft": 148, "spaces_kwarg": 6, "span": 17, "sparisi": 156, "spark": 148, "spars": [131, 159, 166], "spatial": 159, "spawn": [11, 145, 178], "spec": [2, 3, 4, 10, 15, 17, 156], "special": [156, 160, 177], "specialis": 156, "specialist": [160, 163], "specif": [2, 4, 7, 10, 14, 17, 136, 155, 156, 159, 162, 167, 177, 178], "specifi": [2, 5, 6, 7, 9, 14, 16, 17, 18, 20, 126, 127, 128, 129, 130, 135, 137, 138, 139, 140, 141, 143, 146, 147, 149, 153, 154, 155, 156, 158, 161, 162, 166, 168], "speed": [10, 127, 128, 156, 158, 161, 170, 171, 176], "speedup": 178, "spell": 155, "spent": [127, 129], "sphere": 144, "spheric": 145, "sphinx": 1, "spike": 164, "spine": 175, "spinningup": 177, "split": [147, 156], "squar": [17, 144, 145, 154, 156, 159, 166, 175, 178], "squeez": [177, 178], "st": 175, "st_all": 175, "stabil": [14, 18, 19, 140, 141, 155, 159, 164, 168, 177], "stabl": [18, 148, 155, 156, 164, 166, 172], "stable_baselines3": 18, "stack": [6, 17, 18, 20, 156, 177], "stack_siz": 18, "stacked_env": 18, "stage": [17, 156, 162], "stai": [158, 159, 164, 178], "stand": [127, 136, 137, 139, 140, 141, 142, 143, 147, 156, 164, 174], "standard": [18, 19, 148, 155, 156, 157, 164, 177, 178], "standard_norm": 155, "standup": 136, "stare": 162, "start": [1, 2, 5, 7, 9, 11, 13, 17, 136, 156, 157, 158, 161, 162, 164, 174, 175, 177, 178], "start_epsilon": [164, 174], "state": [2, 3, 4, 17, 18, 20, 130, 136, 148, 149, 155, 156, 158, 161, 164, 167, 170, 174, 175, 177, 178], "state_dict": 178, "state_info": 3, "state_s": 175, "state_valu": [174, 178], "state_value_pr": 178, "statefulli": 3, "stateless": [3, 156], "statement": [156, 161], "statetyp": [3, 156], "stationari": 178, "statist": [9, 14, 17, 18, 19, 129, 156, 162, 177], "stats_kei": [14, 17], "std": [14, 162, 164, 177], "std_reward": 162, "stderr": 155, "steer": [128, 159], "stefanbschneid": 156, "step": [2, 3, 4, 10, 11, 12, 14, 15, 16, 17, 18, 19, 20, 127, 129, 131, 132, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 151, 152, 153, 154, 155, 156, 157, 162, 163, 167, 168, 174, 175, 177, 178], "step_api_compat": [9, 160], "step_async": 156, "step_count": 162, "step_index": 9, "step_info": 3, "step_penalti": 159, "step_return": 9, "step_starting_index": 9, "step_trigg": [9, 17], "step_wait": 156, "stepapicompat": [156, 160], "steppabl": 148, "steps_df": 175, "stick": [150, 174], "sticki": 16, "stickyact": [16, 20, 156], "still": [9, 155, 156, 161, 164, 168, 174, 178], "stochast": [16, 130, 131, 133, 134, 136, 151, 152, 155, 175], "stock": 148, "stool": 153, "stop": [17, 150, 156, 158, 164, 167, 174], "stopiter": 13, "storag": 148, "store": [4, 9, 14, 17, 156, 177], "str": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 17, 18, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 156, 174, 175, 177], "straightforward": 161, "strang": 156, "strateg": [133, 134, 159], "strategi": [148, 158, 159, 161, 163, 174], "strict": [2, 155, 156], "strictli": 17, "striker": 155, "string": [2, 4, 5, 7, 9, 14, 18, 155, 156, 158, 159, 166], "stringio": 2, "stronger": 170, "structur": [3, 5, 6, 8, 156, 158, 159, 166], "struggl": 162, "stump": 127, "style": [2, 4, 10, 148, 155, 156, 177], "sub": [6, 10, 11, 12, 14, 156, 163], "subclass": [14, 155], "subject": 146, "submit": [148, 155], "suboptim": 164, "subplot": [164, 174, 175, 178], "subprocess": 11, "subse": 155, "subsect": 170, "subsequ": [6, 155, 161], "subset": [7, 156, 168], "subspac": [5, 6, 7, 8, 14, 18, 155], "substanti": [156, 163], "subtl": 161, "subtract": 178, "succeed": 158, "success": [131, 154, 156, 158, 159, 161, 162, 167], "successfulli": [2, 154, 158, 164, 170], "suffici": [159, 174], "suggest": [155, 164, 178], "suit": [148, 155], "suitabl": [148, 149], "sum": [6, 7, 17, 129, 150, 156, 162, 174, 175, 177], "summaris": 156, "sumo": 148, "super": [2, 14, 15, 148, 155, 159, 166, 168, 177, 178], "superclass": [5, 16, 19], "supersuit": 156, "supertuxkart": 148, "supervis": 164, "suppli": 167, "support": [2, 5, 6, 8, 9, 10, 17, 18, 20, 137, 138, 139, 140, 141, 143, 146, 147, 148, 155, 156, 158, 159, 166], "supportsfloat": [2, 7, 9, 15, 19, 168, 177], "suppos": 9, "suptitl": [174, 178], "sure": [1, 2, 9, 17, 166, 168, 170], "surfac": [142, 143, 147, 166], "surfarrai": 166, "surround": [17, 20], "survei": 163, "suspend": 146, "sutton": [2, 131, 132, 142, 143, 150, 151, 152, 155, 174, 175], "sutton_barto_reward": [132, 156], "swig": [126, 155, 156], "swim": 136, "swimmer": [136, 147, 155], "swing": [131, 135], "swingup": 135, "switch": [155, 156, 158, 161], "symbol": 148, "symptom": 164, "sync": [4, 9, 10, 12, 14, 132, 156], "synchron": [10, 11, 12, 156], "synchronizedarrai": 13, "syncvectorenv": [4, 10, 132, 156, 159, 163, 178], "syntax": 4, "synthes": 148, "synthesi": [140, 141], "system": [131, 135, 136, 142, 155, 156, 159, 166], "system_check": 6, "systemat": [162, 164], "t": [1, 2, 4, 5, 6, 8, 9, 14, 15, 17, 128, 129, 133, 134, 154, 155, 156, 158, 159, 161, 162, 164, 166, 167, 174, 175, 178], "t_cov": [5, 13], "tabl": [155, 164], "tabular": [148, 164, 171, 176], "tag": 148, "tai": 156, "tailkind": 9, "take": [1, 2, 3, 4, 7, 8, 9, 10, 11, 16, 17, 130, 132, 134, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 154, 155, 158, 159, 164, 168, 174, 175, 177, 178], "taken": [10, 17, 18, 20, 130, 132, 158, 162, 163, 166, 172, 177, 178], "talk": [163, 164, 177], "tall": 137, "tan": 156, "tanh": [129, 177], "target": [18, 131, 136, 144, 145, 154, 159, 161, 164, 166, 167, 168, 178], "target_devic": [14, 17], "target_dur": 9, "target_i": [145, 159], "target_posit": 168, "target_x": [145, 159], "target_xp": [14, 17], "task": [2, 6, 15, 128, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 158, 159, 161, 166, 167, 168, 175, 177], "tassa": [139, 140, 141], "tau": 135, "taxi": [149, 155, 156], "taxi_col": 154, "taxi_row": 154, "td": [175, 178], "td3": 172, "td_error": 178, "teach": [158, 164], "team": [155, 156], "technic": [16, 156], "techniqu": [17, 20, 162], "techreport": [133, 134], "tell": [158, 164, 167, 172, 174], "templat": [3, 166], "tempor": 164, "temporal_differ": [164, 174], "temporarili": [13, 164], "ten": [150, 174], "tendon": [140, 141], "tendon_length": [140, 141], "tendon_veloc": [140, 141], "tensor": [14, 17, 20, 177, 178], "term": [2, 14, 18, 130, 131, 136, 137, 138, 139, 140, 141, 142, 144, 145, 146, 147, 159, 164, 166, 168, 178], "termin": [2, 3, 9, 10, 11, 12, 14, 17, 18, 19, 20, 131, 132, 133, 134, 150, 151, 152, 153, 154, 155, 156, 157, 158, 159, 160, 162, 164, 166, 168, 174, 175, 177, 178], "terminal_observ": 155, "terminal_on_life_loss": 17, "terminaltyp": [3, 156], "terminate_when_unhealthi": [137, 139, 140, 147, 170], "terminationwrapp": 170, "terrain": [127, 148, 170], "terri": 156, "terribli": 155, "test": [9, 17, 127, 148, 155, 156, 158, 162, 166, 170, 177], "test_ag": 164, "tetri": 148, "text": [2, 5, 7, 8, 13, 150, 151, 152, 153, 154, 155, 156, 158], "textencod": 155, "th": [17, 18, 20], "than": [1, 4, 6, 16, 129, 131, 132, 133, 134, 143, 144, 150, 155, 156, 158, 159, 162, 164, 170, 174, 175, 178], "thank": 156, "theden": 155, "thei": [5, 11, 17, 20, 136, 149, 150, 151, 152, 153, 155, 156, 159, 161, 163, 166, 170, 178], "theirfor": 178, "them": [3, 5, 14, 15, 17, 129, 137, 138, 145, 148, 154, 155, 156, 160, 161, 168, 170, 178], "themselv": 148, "theo": 156, "theorem": 148, "theoret": [148, 155, 156, 164], "theori": [135, 142, 155, 158, 175, 178], "therefor": [2, 5, 17, 137, 140, 141, 145, 147, 155, 156, 171, 173, 176], "thesi": [133, 134, 146], "theta": [135, 155], "theta1": 131, "theta2": 131, "theta_dt": 135, "thi": [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 126, 127, 128, 129, 130, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 150, 151, 152, 153, 154, 155, 156, 157, 158, 159, 160, 162, 163, 164, 166, 167, 168, 170, 172, 174, 175, 177, 178], "thigh": [138, 139, 140, 141, 147], "thigh_joint": [139, 147], "thigh_left_joint": 147, "thing": [13, 15, 155, 164, 168], "think": [13, 148, 158], "third": [137, 138, 139, 140, 141, 143, 146, 147, 155, 156, 166], "third_party_environ": 155, "thoma": 175, "thoroughli": 159, "those": [13, 14, 131, 155, 159, 168, 175, 178], "though": [6, 11, 155], "thought": [155, 156, 164], "thousand": [156, 162], "thousandth": 17, "thread": 156, "three": [5, 6, 15, 139, 140, 141, 146, 155, 156, 159, 166], "threshold": [4, 131, 132, 154, 166], "throttl": [129, 159], "through": [2, 3, 4, 5, 10, 11, 12, 14, 17, 18, 20, 140, 141, 148, 155, 156, 157, 158, 159, 160, 163, 164, 167], "throw": [156, 168], "thrower": 155, "thrown": 7, "thruster": 129, "thu": [11, 137, 140, 141, 142, 156, 178], "thytu": 156, "ti": 175, "tick": 166, "tight_layout": [164, 174, 175, 178], "tile": [128, 153, 175], "tileset": 153, "till": [174, 178], "till2": 156, "tilleri": 153, "tilt": 129, "tim": 175, "time": [1, 2, 5, 6, 9, 10, 14, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 127, 128, 132, 135, 137, 138, 139, 140, 141, 142, 144, 145, 146, 147, 148, 151, 152, 154, 155, 156, 158, 159, 161, 162, 163, 164, 166, 169, 170, 171, 172, 174, 177, 178], "time_limit": [153, 154], "time_queu": [14, 17, 162], "timeawareobserv": [10, 18, 20, 156, 158], "timelaps": 162, "timelimit": [2, 4, 15, 17, 20, 127, 128, 129, 131, 132, 133, 134, 135, 156, 158, 166, 167], "times10": [137, 140, 141], "timestamp": 2, "timestep": [2, 17, 18, 20, 133, 134, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 158, 159, 166, 170, 177, 178], "timgates42": 155, "timschneider42": 156, "tip": [138, 142, 146, 147], "tips_arm": 144, "titl": [9, 133, 134, 156, 162, 174, 175, 177], "tmrl": 148, "to_json": [5, 156], "to_torch": 156, "tobirohr": 156, "toctre": 1, "todorov": [139, 140, 141], "togeth": [5, 12, 136, 161, 175], "toi": [126, 150, 151, 152, 153, 154, 155], "tom": 154, "toml": 166, "ton": 155, "too": [137, 138, 139, 140, 141, 142, 144, 145, 146, 147, 158, 159, 170, 175], "took": 162, "tool": [137, 138, 139, 140, 141, 143, 146, 147, 148, 158, 162], "toolbox": 148, "toolkit": 148, "top": [128, 129, 130, 133, 134, 139, 142, 143, 147, 148, 155, 156, 159, 166, 175, 177], "torch": [2, 14, 17, 20, 156, 177, 178], "torqu": [127, 129, 131, 135, 137, 138, 139, 140, 141, 144, 145, 146, 147], "torso": [137, 138, 139, 140, 141, 147, 170], "toss": 7, "total": [2, 127, 128, 129, 137, 138, 139, 140, 141, 142, 144, 145, 146, 147, 154, 158, 162, 164, 175, 177, 178], "total_episod": 175, "total_num_episod": 177, "total_reward": [158, 164, 175], "total_timestep": 156, "touch": [14, 159, 166], "touretzki": 131, "toward": [146, 155, 164], "tower": 156, "towers2024gymnasium": 156, "towers_gymnasium_2023": 156, "town": 156, "toy_text": [153, 155, 174, 175], "tpu": 163, "tqdm": [164, 174, 175, 178], "trace": [127, 156], "traceback": [13, 17], "track": [9, 14, 17, 20, 128, 132, 137, 138, 139, 140, 146, 147, 148, 156, 164], "trackmania": 148, "trade": [148, 156, 158, 159], "tradeoff": 178, "traffic": 148, "train": [10, 137, 140, 141, 142, 145, 148, 155, 156, 158, 159, 161, 172, 175], "training_env": 161, "training_error": [164, 174], "training_error_moving_averag": [164, 174], "training_period": 162, "training_video": 162, "trajectori": [14, 18, 19, 129, 140, 141], "transfer": [14, 17, 148, 163], "transform": [3, 5, 8, 9, 14, 15, 16, 18, 19, 20, 145, 168], "transformact": [14, 16, 20], "transformob": 156, "transformobserv": [14, 18, 20], "transformreward": [14, 19, 20], "transit": [3, 9, 140, 141, 151, 152, 153, 154, 156, 157, 167, 178], "transition_info": 3, "translat": [137, 140, 141, 156, 159, 166], "transport": 148, "transpos": [9, 166], "treasur": 175, "treat": 158, "treatment": 148, "tremend": 155, "trend": 162, "tri": 156, "trial": [158, 164], "trigaten": 155, "trigger": [9, 17, 154, 162], "tristan": 156, "tristandeleu": 155, "trivial": [158, 159, 166], "true": [2, 4, 6, 8, 9, 10, 11, 12, 14, 15, 16, 17, 18, 19, 127, 128, 132, 136, 137, 138, 139, 140, 141, 146, 147, 150, 153, 154, 155, 156, 158, 160, 162, 164, 166, 170, 174, 175, 177, 178], "true_": [16, 18], "trunc": [14, 18], "truncat": [2, 4, 9, 10, 11, 12, 14, 17, 18, 19, 20, 128, 131, 132, 133, 134, 153, 154, 155, 156, 157, 158, 159, 160, 162, 164, 166, 168, 170, 174, 175, 177, 178], "trunk": 170, "try": [141, 148, 155, 156, 158, 159, 164, 174], "tuckerbmorgan": 155, "tune": [148, 177], "tupl": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 20, 137, 139, 140, 147, 150, 155, 156, 158, 159, 161, 164, 166, 174, 177, 178], "turbotimon": 156, "turbul": [129, 155], "turbulence_pow": [129, 178], "turn": [9, 11, 17, 128, 129, 142, 148, 155, 156], "tutori": [2, 15, 156, 159, 161, 162, 164, 165, 166, 167, 168, 169, 170, 173, 174, 175, 176, 177, 178], "tutorials_jupyt": 171, "tutorials_python": 171, "tweak": [136, 146], "two": [2, 5, 6, 7, 9, 10, 17, 18, 20, 127, 129, 131, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 145, 146, 147, 148, 150, 155, 156, 159, 162, 163, 166, 174, 178], "txt": [1, 155], "type": [2, 4, 5, 6, 7, 10, 14, 16, 17, 18, 20, 128, 132, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 155, 156, 159, 161, 166, 168, 175, 177], "typeerror": 156, "typic": [2, 9, 154, 159, 162, 170], "typo": [155, 156], "u": [5, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 155, 156, 159, 164, 166, 168, 174, 177], "uav": 148, "uint8": [18, 128], "un": 132, "unattach": [144, 145], "unbound": [7, 18], "uncertain": 148, "uncertainti": 148, "unclear": [156, 159], "uncom": 170, "uncommon": 156, "undefin": 2, "under": [2, 156, 174, 177], "underli": [2, 15, 17, 131, 156, 158], "underneath": [15, 132, 158], "underpow": 130, "underscor": [155, 161], "understand": [2, 8, 10, 144, 156, 159, 161], "undocu": 156, "uneven": 127, "unexpect": [11, 129, 155], "unflatten": [5, 8, 156], "unhealthi": [137, 139, 140, 142, 143, 147], "unicod": 9, "uniform": [5, 7, 8, 133, 134, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 175], "uniformli": [7, 131, 132, 154, 166], "uniniti": 159, "unintend": 156, "union": [6, 7, 19, 156], "uniqu": [6, 10, 126, 130, 136, 142, 155, 161], "unit": [5, 14, 18, 20, 129, 131, 133, 134, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148], "uniti": 148, "unitless": [142, 145], "unitre": 170, "unitree_go1": 170, "univers": [133, 134, 175], "unknown": [2, 9, 10, 148, 158], "unless": [7, 15, 150, 151, 152, 153, 154, 155, 166], "unlik": [6, 164, 177], "unmaintain": 156, "unnecessari": [155, 156], "unnecessarili": 161, "unnescesari": 155, "unord": 5, "unpack": 161, "unpickl": [9, 13, 155, 156], "unplay": 9, "unreli": 161, "unsupport": 7, "untermin": 132, "until": [17, 144, 150, 151, 152, 153, 155, 156, 158, 164, 166, 175, 177, 178], "unus": [155, 159], "unusu": 162, "unwrap": [2, 10, 15, 131, 156, 158, 159], "up": [2, 6, 7, 10, 127, 129, 136, 137, 139, 140, 141, 147, 150, 151, 152, 153, 154, 156, 158, 159, 162, 164, 166, 170, 171, 174, 175, 176], "updat": [1, 2, 3, 9, 14, 16, 17, 18, 19, 137, 139, 140, 147, 154, 155, 156, 158, 159, 160, 166, 167, 168, 174, 175, 177, 178], "update_paramet": 178, "update_q_valu": 161, "update_running_mean": [18, 19], "upfront": 161, "upgrad": [155, 156], "uph": 141, "uph_cost": 141, "uph_cost_weight": 141, "upload": 162, "upon": [133, 134, 161], "upper": [7, 14, 19, 20, 140, 141, 155, 158], "upright": [132, 135, 142, 143, 158], "upsid": 156, "upstream": 156, "urandom": 2, "urban": 148, "urdf": 170, "url": [155, 156, 178], "urldat": 156, "us": [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 17, 18, 19, 20, 126, 127, 129, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 153, 154, 155, 156, 158, 160, 162, 163, 164, 167, 168, 170, 171, 174, 176], "usabl": [150, 155, 164, 174], "usable_ac": [164, 174], "usag": [9, 156, 159, 161, 162, 164, 168], "use_contact_forc": [137, 156], "use_cuda": 178, "useless": 170, "user": [2, 3, 4, 5, 9, 10, 12, 14, 18, 20, 131, 132, 133, 134, 135, 155, 156, 158, 161, 165, 166, 169, 171, 177], "usual": [2, 6, 7, 17, 139, 158, 164, 166, 168, 170, 174, 178], "util": [18, 148, 155, 156, 158, 159, 160, 161, 166, 178], "utilis": [10, 155], "utli": 156, "v": [4, 133, 134, 161, 178], "v0": [2, 4, 9, 10, 14, 16, 17, 18, 19, 127, 128, 129, 131, 132, 133, 134, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 150, 151, 152, 153, 154, 159, 166, 167, 172, 177], "v1": [2, 4, 9, 10, 11, 12, 14, 16, 17, 18, 19, 127, 128, 129, 131, 132, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 150, 151, 152, 153, 154, 155, 158, 160, 162, 164, 172, 174, 175], "v2": [127, 128, 129, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 154, 155, 156], "v21": [155, 156], "v24": 155, "v25": 155, "v26": [2, 156, 177], "v28": 156, "v2g": 148, "v3": [9, 14, 17, 18, 127, 128, 129, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 154, 155, 156, 157, 158, 161, 168, 178], "v4": [14, 15, 16, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 155, 156, 172, 177], "v5": [17, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 156, 161, 170], "vairodp": 156, "val": 175, "valentin": 156, "valid": [2, 4, 5, 7, 10, 13, 14, 158, 164, 174, 178], "vallei": [133, 134], "valu": [2, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 20, 127, 129, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 150, 151, 152, 153, 154, 155, 156, 158, 161, 164, 166, 167, 170, 174, 175, 177, 178], "value_funct": 161, "value_grid": 174, "value_pr": 178, "valueerror": [7, 8, 11, 12, 13, 17], "vampir": 148, "var": 19, "vari": [132, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 177], "variabl": [2, 5, 7, 11, 13, 14, 15, 17, 136, 137, 139, 146, 147, 148, 155, 156, 158, 166, 167, 174, 177], "varianc": [14, 18, 19, 20, 178], "variant": [128, 166], "variat": 136, "varieti": [9, 148], "variou": [5, 141, 148, 155, 177], "ve": [155, 156, 159, 164], "vec_env": [9, 159], "vecenvwrapp": 155, "vector": [2, 4, 7, 9, 11, 12, 16, 17, 18, 19, 127, 129, 142, 143, 145, 148, 155, 156, 158, 159, 162, 171, 176, 177], "vector_a2c": 178, "vector_entry_point": [4, 132, 156], "vector_env": 14, "vector_kwarg": 4, "vector_list_info": 155, "vectoractionwrapp": [14, 156], "vectorenv": [4, 5, 14, 155, 156], "vectorenvcr": 4, "vectorenvwrapp": 156, "vectoris": [5, 148], "vectorization_mod": [4, 9, 10, 11, 12, 14, 132, 156], "vectorizemod": 4, "vectorizetransformact": [14, 20], "vectorizetransformobserv": [14, 20], "vectorizetransformreward": [14, 20], "vectorizor": [4, 132], "vectorlistinfo": [14, 155, 156], "vectorobservationwrapp": [14, 156], "vectorrewardwrapp": [14, 156], "vectorwrapp": [14, 156], "vehicl": 148, "veloc": [2, 8, 13, 127, 129, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 158, 159], "velocity_penalti": 142, "veri": [6, 129, 144, 155, 156, 158, 159, 163, 164, 166, 178], "verifi": [9, 159, 161, 164], "vermouth1992": [155, 156], "versa": [13, 17, 18], "version": [1, 2, 4, 5, 14, 16, 17, 18, 19, 148, 155, 156, 159, 161, 164, 166, 167, 168, 170, 174, 175, 177, 178], "vertic": [127, 139, 141, 142, 143, 147, 159, 166], "vf_next_stat": 167, "vf_target": 167, "via": [5, 9, 14, 15, 17, 126, 130, 136, 148, 149, 158, 166, 177], "viabl": 174, "vicbentu": 156, "vice": [13, 17, 18], "vicent": 156, "video": [1, 17, 20, 127, 155, 156, 158, 159, 162, 164, 170, 172, 175], "video0": 170, "video_fold": [9, 17, 162], "video_length": [9, 17], "video_path": 162, "videorecord": [17, 155, 156], "view": [2, 156, 159, 170], "view_init": 174, "viewer": [10, 11, 12, 156], "viewport": 129, "viewport_h": 129, "viewport_w": 129, "virgilt": 155, "viridi": 174, "viscou": 146, "visibl": 166, "visit": [128, 175], "visual": [148, 158, 159, 161, 162, 164, 170], "visual_env": 161, "visual_opt": [136, 156], "visualis": 2, "vizdoom": 148, "vmoen": [155, 156], "voidflight": 156, "vol": [131, 154], "volleybal": 148, "volunt": 156, "vscode": [156, 172], "vwxyzjn": 155, "vx": [14, 17, 129], "vy": 129, "w": [9, 137, 140, 141, 178], "w_": [137, 138, 139, 140, 141, 144, 145, 146, 147], "wa": [2, 4, 6, 9, 10, 14, 17, 18, 19, 132, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 155, 156, 159, 160, 161, 164, 167, 168, 177, 178], "wai": [2, 13, 15, 17, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 155, 156, 158, 164, 167, 168, 174, 175, 178], "wait": [9, 10, 11, 155, 167], "wait_on_play": 9, "wake": 129, "walk": [136, 140, 147, 149, 153, 156, 159, 166, 170], "walker": [126, 145, 147, 155], "walker2d": [136, 156], "walker2d_v5": 147, "wall": [133, 134, 154, 159, 162], "wandb": 162, "want": [1, 2, 4, 6, 11, 15, 17, 137, 140, 141, 155, 156, 158, 159, 161, 162, 166, 168, 170, 174, 175, 178], "ward": 177, "warehous": 148, "warn": [6, 9, 10, 11, 17, 144, 155, 156], "wasn": 17, "watch": [1, 162, 164, 172], "water": 148, "wawrzy\u0144ski": 138, "we": [1, 2, 3, 4, 5, 7, 9, 13, 18, 148, 155, 156, 157, 158, 159, 160, 161, 162, 163, 164, 166, 167, 168, 170, 174, 177, 178], "web": 148, "websit": [21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 136, 155, 156], "weigh": 137, "weight": [137, 138, 139, 140, 141, 144, 145, 146, 147, 148, 155, 162, 167, 168, 177], "well": [2, 5, 14, 131, 148, 155, 159, 164, 166, 175, 178], "were": [126, 131, 136, 154, 155, 156, 161, 164, 166, 170, 178], "weren": 161, "west": 154, "what": [2, 5, 6, 148, 151, 152, 156, 159, 162, 163], "wheel": [126, 128, 155], "when": [2, 4, 5, 8, 9, 10, 11, 12, 13, 14, 17, 18, 20, 128, 129, 137, 139, 140, 141, 142, 143, 144, 147, 151, 152, 153, 154, 155, 156, 158, 159, 160, 161, 164, 166, 167, 168, 170, 175, 177, 178], "whenev": [17, 129, 166], "where": [1, 4, 6, 7, 8, 9, 14, 17, 128, 129, 131, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 150, 151, 152, 153, 154, 155, 156, 157, 158, 159, 162, 163, 164, 166, 167, 168, 170, 174, 175, 177, 178], "wherea": 175, "whether": [2, 3, 4, 5, 7, 9, 15, 17, 129, 137, 138, 139, 140, 141, 146, 147, 148, 150, 158, 159, 164, 166, 167, 174, 177], "which": [1, 2, 4, 5, 8, 9, 10, 14, 17, 18, 127, 128, 129, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 150, 151, 152, 153, 154, 155, 156, 158, 159, 161, 163, 166, 167, 168, 170, 172, 175, 177, 178], "while": [4, 8, 9, 11, 14, 17, 18, 19, 129, 131, 132, 135, 137, 140, 141, 146, 150, 151, 152, 155, 158, 159, 161, 162, 164, 166, 167, 174, 175, 177, 178], "white": 155, "who": 156, "whole": [4, 155, 156, 170], "whose": [137, 150], "why": [129, 164], "wide": [148, 158], "width": [136, 156, 166], "wikipedia": 175, "wildli": 164, "willdudlei": 156, "william": [133, 134, 177], "win": [150, 164, 174], "win_rat": 164, "wind": [129, 155, 156], "wind_pow": [129, 155, 178], "window": [2, 9, 128, 136, 155, 156, 158, 161, 162, 164, 166], "window_s": 166, "wing": 148, "wire": 148, "wireless": 148, "wise": 177, "wish": [9, 155, 156], "within": [2, 5, 7, 9, 13, 14, 16, 17, 18, 20, 129, 130, 143, 155, 156, 158, 159], "without": [14, 15, 17, 19, 140, 148, 150, 153, 155, 156, 158, 159, 164, 166, 170, 174], "won": [2, 164, 174], "word": [144, 177], "work": [5, 9, 128, 129, 131, 138, 139, 142, 143, 148, 155, 156, 158, 159, 161, 164], "worker": 11, "workflow": 156, "workshop": 148, "world": [129, 148, 151, 152, 153, 154, 156, 175], "worldbodi": [137, 140, 141], "worri": 166, "wors": [155, 164], "would": [6, 8, 16, 18, 19, 137, 138, 139, 140, 146, 147, 155, 156, 157, 166, 168, 170, 178], "wouldn": 156, "wrap": [2, 4, 9, 11, 12, 14, 15, 16, 17, 18, 19, 20, 148, 158, 159, 166, 168, 177, 178], "wrapped_env": [14, 15, 16, 17, 18, 158, 159, 166, 168, 177], "wrapped_env_ob": 16, "wrapped_obs0": 18, "wrapped_obs1": 18, "wrappedenvacttyp": 156, "wrappedenvobstyp": 156, "wrapper": [2, 4, 6, 7, 9, 10, 13, 137, 138, 139, 140, 141, 143, 146, 147, 148, 153, 154, 155, 156, 157, 158, 160, 162, 164, 169, 171, 174, 177, 178], "wrapper_spec": 15, "wrapperacttyp": [15, 16], "wrapperobstyp": [15, 18], "wrapperspec": [4, 15], "wrist": 144, "write": [5, 11, 13, 156, 159, 166, 170], "write_to_shared_memori": [5, 13], "written": [9, 156, 163], "wrong": [155, 156, 158, 159, 161, 164], "www": [128, 150, 151, 152, 153, 155], "x": [2, 5, 8, 14, 129, 132, 133, 134, 135, 137, 138, 139, 140, 141, 142, 144, 145, 146, 147, 148, 151, 152, 156, 159, 162, 166, 175, 177, 178], "x_": [137, 138, 139, 140, 142, 146, 147], "x_init": 133, "x_posit": [14, 137, 138, 139, 140, 141, 146, 147], "x_veloc": 14, "xlabel": 162, "xml": [137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 155, 156, 170], "xml_file": [136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 156, 170], "xp": 14, "xpo": [137, 140, 144, 145], "xtick": 174, "xticklabel": 175, "xuanhien070594": 156, "xuehaipan": [155, 156], "xx": 175, "xy": 142, "y": [2, 129, 135, 137, 138, 139, 140, 141, 142, 144, 145, 146, 154, 159, 175, 177], "y_": 142, "y_coordin": 142, "y_init": 133, "y_posit": [137, 138, 139, 140, 141, 146, 147], "yaniv": 156, "year": [133, 134, 155, 156], "yellow": 154, "yet": [148, 156], "yield": 13, "ylabel": [162, 175], "you": [1, 2, 5, 6, 7, 8, 9, 11, 14, 15, 16, 17, 18, 19, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 127, 128, 137, 140, 141, 148, 155, 156, 157, 158, 161, 162, 164, 166, 167, 168, 170, 172, 175, 178], "youjiacheng": 155, "youni": [155, 156], "younik": [155, 156], "your": [1, 2, 5, 9, 11, 14, 15, 16, 17, 18, 128, 137, 140, 141, 148, 155, 156, 157, 163, 168, 169, 171, 174, 178], "your_env": 9, "yourself": [11, 128, 159, 166, 174], "ytick": 174, "yticklabel": 175, "z": [137, 138, 139, 140, 141, 142, 144, 145, 147], "z_": 141, "z_distance_from_origin": [139, 141, 147], "zaxi": 174, "zemann": [174, 178], "zenodo": 156, "zero": [7, 13, 18, 135, 137, 139, 140, 141, 147, 156, 164, 166, 167, 174, 175, 177, 178], "zero_grad": [177, 178], "zhiqingxiao": 155, "zip": 171, "zlig": 155, "zoom": 9, "zuoxingdong": 155, "zzyunzhi": 155}, "titles": ["404 - Page Not Found", "Gymnasium-docs", "Env", "Functional Env", "Make and register", "Spaces", "Composite Spaces", "Fundamental Spaces", "Spaces Utils", "Utility functions", "Vectorize", "AsyncVectorEnv", "SyncVectorEnv", "Utility functions", "Wrappers", "Wrappers", "Action Wrappers", "Misc Wrappers", "Observation Wrappers", "Reward Wrappers", "List of Wrappers", "Atari", "Adventure", "Air Raid", "Alien", "Amidar", "Assault", "Asterix", "Asteroids", "Atlantis", "Atlantis2", "Backgammon", "Bank Heist", "Basic Math", "Battle Zone", "Beam Rider", "Berzerk", "Blackjack", "Bowling", "Boxing", "Breakout", "Carnival", "Casino", "Centipede", "Chopper Command", "Crazy Climber", "Crossbow", "Darkchambers", "Defender", "Demon Attack", "Donkey Kong", "Double Dunk", "Earthworld", "Elevator Action", "Enduro", "Entombed", "Et", "Fishing Derby", "Flag Capture", "Freeway", "Frogger", "Frostbite", "Galaxian", "Gopher", "Gravitar", "Hangman", "Haunted House", "Hero", "Human Cannonball", "Ice Hockey", "Jamesbond", "Journey Escape", "Kaboom", "Kangaroo", "Keystone Kapers", "King Kong", "Klax", "Koolaid", "Krull", "Kung Fu Master", "Laser Gates", "Lost Luggage", "Mario Bros", "Miniature Golf", "Montezuma Revenge", "Mr Do", "Ms Pacman", "Name This Game", "Othello", "Pacman", "Phoenix", "Pitfall", "Pitfall2", "Pong", "Pooyan", "Private Eye", "Qbert", "Riverraid", "Road Runner", "Robotank", "Seaquest", "Sir Lancelot", "Skiing", "Solaris", "Space Invaders", "Space War", "Star Gunner", "Superman", "Surround", "Tennis", "Tetris", "Tic Tac Toe 3D", "Time Pilot", "Trondead", "Turmoil", "Tutankham", "Up N Down", "Venture", "Video Checkers", "Video Chess", "Video Cube", "Video Pinball", "Wizard Of Wor", "Word Zapper", "Yars Revenge", "Zaxxon", "Box2D", "Bipedal Walker", "Car Racing", "Lunar Lander", "Classic Control", "Acrobot", "Cart Pole", "Mountain Car", "Mountain Car Continuous", "Pendulum", "MuJoCo", "Ant", "Half Cheetah", "Hopper", "Humanoid", "Humanoid Standup", "Inverted Double Pendulum", "Inverted Pendulum", "Pusher", "Reacher", "Swimmer", "Walker2D", "External Environments", "Toy Text", "Blackjack", "Cliff Walking", "Cliff Walking Slippery", "Frozen Lake", "Taxi", "Gym Release Notes", "Gymnasium Release Notes", "<no title>", "Basic Usage", "Create a Custom Environment", "Compatibility with Gym", "Migration Guide - v0.21 to v1.0.0", "Recording Agents", "Speeding Up Training", "Training an Agent", "Gymnasium Basics", "Make your own custom environment", "Handling Time Limits", "Implementing Custom Wrappers", "Gymnasium Basics", "Load custom quadruped robot environments", "Tutorials", "Third-Party Tutorials", "Training Agents", "Solving Blackjack with Tabular Q-Learning", "Solving Frozenlake with Tabular Q-Learning", "Training Agents", "Training using REINFORCE for Mujoco", "Speeding up A2C Training with Vector Envs"], "titleterms": {"0": [155, 156, 161, 170], "0a1": 156, "0a2": 156, "1": [155, 156, 161, 170], "11": 175, "12": 155, "19": 155, "2": [155, 156, 161, 170], "20": 155, "21": [155, 160, 161], "22": 155, "23": 155, "24": 155, "25": 155, "26": [155, 156, 161], "27": 156, "28": 156, "29": 156, "3": [155, 156, 161, 170], "3d": 111, "4": [155, 161, 170, 175], "404": 0, "5": [155, 161], "6": 155, "7": [155, 175], "9": [155, 175], "Not": 0, "Of": 122, "The": [0, 161, 164, 175], "__init__": 159, "a2c": 178, "about": [159, 164, 172], "acrobot": 131, "across": 136, "action": [14, 16, 53, 127, 128, 129, 131, 132, 133, 134, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 150, 151, 152, 153, 154, 158, 159, 164, 174], "actionwrapp": 168, "actor": 178, "ad": [1, 159], "add": 159, "addit": [4, 10, 11, 12], "advanc": 159, "advantag": 178, "adventur": 22, "agent": [158, 162, 164, 170, 171, 173, 174, 176, 177, 178], "agilerl": 172, "air": 23, "algorithm": 163, "alien": 24, "alpha": 156, "alpha1": 156, "altern": 166, "amidar": 25, "an": [1, 164, 174, 177], "analysi": 178, "analyz": 164, "ant": 137, "api": [9, 160, 161], "argument": [127, 128, 129, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 150, 151, 152, 153, 154], "assault": 26, "asterix": 27, "asteroid": 28, "asynchron": 178, "asyncvectorenv": 11, "atari": 21, "atlanti": 29, "atlantis2": 30, "attack": 49, "attribut": [2, 5, 10, 15], "autonom": 148, "avail": 16, "backend": 136, "backgammon": 31, "bank": 32, "base": [3, 16], "basic": [33, 158, 165, 169, 171], "battl": 34, "beam": 35, "befor": 159, "beginn": 158, "benchmark": 9, "benefit": 162, "berzerk": 36, "best": 162, "better": 174, "biolog": 148, "biped": 127, "blackjack": [37, 150, 164, 174], "boundari": 159, "bowl": 38, "box": 39, "box2d": 126, "breakdown": 161, "breakout": 40, "bro": 82, "build": [1, 164, 174, 177], "can": 174, "cannonbal": 68, "captur": 58, "car": [128, 133, 134], "carniv": 41, "cart": 132, "casino": 42, "centiped": 43, "chang": 161, "check": [9, 159], "checker": 118, "cheetah": 138, "chess": 119, "chopper": 44, "class": 16, "classic": 130, "cliff": [151, 152], "climber": 45, "close": 166, "code": [158, 159, 161, 167, 172], "command": 44, "common": [14, 17, 158, 159, 164], "compar": 136, "comparison": 161, "compat": [9, 160, 161], "complet": 161, "complex": 159, "composit": [5, 6], "comput": 148, "construct": [159, 166], "continu": 134, "control": 130, "convers": [14, 17], "convert": 3, "core": 4, "could": 0, "crazi": 45, "creat": [2, 159, 166, 175], "credit": [127, 128, 129], "critic": 178, "crossbow": 46, "cube": 120, "curv": 177, "custom": [159, 166, 168, 170], "darkchamb": 47, "data": [14, 17], "debug": 159, "declar": 166, "deep": 161, "defend": 48, "demon": 49, "derbi": 57, "descript": [127, 128, 129, 131, 132, 133, 134, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 150, 151, 152, 153, 154], "design": 159, "did": 161, "do": [85, 174], "doc": 1, "document": 1, "domain": 178, "done": 161, "donkei": 50, "doubl": [51, 142], "down": 116, "download": 170, "drive": 148, "dunk": 51, "dure": [162, 164], "dynam": [133, 134], "earthworld": 52, "econom": 148, "edit": 1, "electr": 148, "elev": 53, "end": [131, 132, 133, 134, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 150, 151, 152, 153, 154], "enduro": 54, "energi": 148, "entomb": 55, "env": [2, 3, 166, 178], "environ": [1, 2, 3, 9, 10, 132, 148, 158, 159, 160, 161, 163, 164, 166, 170, 174, 175, 178], "epilogu": 170, "episod": [127, 128, 129, 131, 132, 133, 134, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 150, 151, 152, 153, 154, 162], "error": 159, "escap": 71, "et": 56, "evalu": 162, "everi": 162, "exact": 136, "exampl": 159, "execut": [164, 174], "expect": 164, "experi": 162, "explain": 158, "exploit": 164, "explor": 164, "extern": 148, "ey": 95, "featur": 159, "financi": 148, "first": [148, 158], "fish": 57, "flag": 58, "found": 0, "framework": 161, "freecodecamp": 172, "freewai": 59, "frogger": 60, "from": [166, 168, 172], "frostbit": 61, "frozen": 153, "frozenlak": 175, "fu": 79, "function": [3, 4, 5, 9, 13, 159, 161], "fundament": [5, 7], "galaxian": 62, "game": [87, 148], "gate": 80, "gener": [161, 166], "get": [161, 164], "golf": 83, "gopher": 63, "gradual": 159, "gravitar": 64, "gridworld": 159, "guid": 161, "gunner": 106, "gym": [148, 155, 160], "gymnasium": [1, 10, 148, 156, 158, 165, 166, 168, 169, 171, 172], "half": 138, "handl": [159, 167], "hangman": 65, "haunt": 66, "heist": 32, "help": 161, "helper": 161, "hero": 67, "heurist": 163, "histori": [127, 128, 129, 131, 132, 133, 134, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 150, 151, 152, 153, 154], "hockei": 69, "hopper": 139, "hous": 66, "human": 68, "humanoid": [140, 141], "i": 158, "ic": 69, "implement": [2, 14, 18, 19, 168], "import": [167, 174], "improv": 164, "includ": 161, "inform": [150, 151, 152, 153, 154, 162], "inherit": 168, "initi": [156, 158, 166], "instanc": 166, "instruct": 1, "integr": 162, "interpret": 164, "introduct": 178, "intuit": 164, "invad": 104, "invert": [142, 143], "issu": [158, 159, 164], "jamesbond": 70, "jax": 3, "johnni": 172, "journei": 71, "kaboom": 72, "kangaroo": 73, "kaper": 74, "kei": [159, 161], "keyston": 74, "king": 75, "klax": 76, "known": 159, "kong": [50, 75], "koolaid": 77, "krull": 78, "kung": 79, "lake": 153, "lancelot": 101, "lander": 129, "laser": 80, "learn": [158, 159, 161, 164, 167, 174, 175, 177], "librari": 172, "limit": 167, "list": 20, "ll": 175, "load": [160, 170, 178], "loop": [158, 164], "lost": 81, "luggag": 81, "lunar": 129, "m": 86, "make": [4, 10, 159, 166], "manual": 159, "map": 175, "mario": 82, "master": 79, "math": 33, "mathemat": 148, "medic": 148, "memori": 13, "method": [2, 5, 10, 11, 12, 15], "migrat": 161, "miniatur": 83, "misc": 17, "miscellan": 13, "mode": 161, "model": 170, "modifi": [1, 158], "montezuma": 84, "more": 162, "mountain": [133, 134], "mr": 85, "mujoco": [136, 177], "n": 116, "name": [87, 161], "network": 177, "never": 164, "new": [1, 9, 161], "next": [158, 159, 164], "note": [129, 146, 155, 156], "notic": 178, "number": 161, "observ": [14, 18, 127, 128, 129, 131, 132, 133, 134, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 150, 151, 152, 153, 154, 158, 159, 166, 170, 174], "observationwrapp": 168, "old": [9, 161], "onli": [14, 20], "openai": 160, "optim": 163, "othello": 88, "other": [1, 148], "output": 162, "own": 166, "packag": [161, 166], "pacman": [86, 89], "page": [0, 1], "paramet": [170, 175], "parameter": 159, "parti": [148, 172], "pendulum": [135, 142, 143], "perform": [9, 136, 178], "period": 162, "phoenix": 90, "pickl": 9, "pilot": 112, "pinbal": 121, "pitfal": [91, 159], "pitfall2": 92, "plai": 178, "plot": [177, 178], "pole": 132, "polici": [174, 177], "pong": 93, "poor": 164, "pooyan": 94, "practic": 162, "privat": 95, "problem": 159, "process": 164, "program": 158, "pusher": 144, "q": [161, 164, 174, 175], "qbert": 96, "quadrup": 170, "question": 159, "quick": 161, "race": 128, "raid": 23, "random": [161, 178], "reacher": 145, "read": 161, "real": 159, "recommend": 166, "record": 162, "refer": [128, 131, 150, 151, 152, 154, 161, 175, 177, 178], "regist": [4, 159, 166], "reinforc": [158, 177], "releas": [155, 156], "remov": 161, "render": [9, 136, 159, 161, 166], "represent": 159, "reproduc": 136, "request": 0, "research": 159, "reset": [128, 159, 161, 166], "result": 164, "reveng": [84, 124], "reward": [14, 19, 127, 128, 129, 131, 132, 133, 134, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 150, 151, 152, 153, 154, 159, 170], "rewardwrapp": 168, "rider": 35, "riverraid": 97, "rl": [158, 161], "road": 98, "robot": [148, 170], "robotank": 99, "run": 175, "runner": 98, "runtim": 9, "save": [9, 178], "seaquest": 100, "seed": [9, 161], "setup": [166, 170, 174, 178], "share": 13, "should": 161, "showcas": 178, "side": 161, "simpl": 159, "simul": 170, "sir": 101, "size": 175, "ski": 102, "slipperi": 152, "slow": 164, "solari": 103, "solut": [164, 166, 167], "solv": [174, 175], "space": [5, 6, 7, 8, 13, 104, 105, 127, 128, 129, 131, 132, 133, 134, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 150, 151, 152, 153, 154, 158, 159], "specif": 161, "speed": [163, 178], "split": 161, "standard": 3, "standup": 141, "star": 106, "start": [127, 128, 129, 131, 132, 133, 134, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 150, 151, 152, 153, 154, 159], "state": [127, 128, 129, 131, 132, 133, 134, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 150, 151, 152, 153, 154, 159, 166], "step": [1, 9, 158, 159, 160, 161, 164, 166, 170], "strategi": 164, "stuck": 164, "subclass": 166, "summari": 162, "superman": 107, "surround": 108, "swimmer": 146, "synchron": 178, "syncvectorenv": 12, "system": 148, "tabl": [161, 175], "tabular": [174, 175], "tac": 111, "taxi": 154, "telecommun": 148, "tenni": 109, "termin": [127, 128, 129, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 161, 167, 170], "test": [159, 161, 164], "tetri": 110, "text": 149, "thi": [87, 161], "think": [159, 174], "third": [148, 172], "tic": 111, "time": [112, 167, 175], "timelimit": 161, "tip": 159, "toe": 111, "toi": 149, "too": 164, "track": 162, "train": [136, 162, 163, 164, 170, 171, 173, 174, 176, 177, 178], "transit": [133, 134], "trondead": 113, "truncat": [135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 161, 167], "try": 178, "turmoil": 114, "tutankham": 115, "tutori": [1, 171, 172], "tweak": 170, "uncommon": 17, "understand": [158, 162, 164], "unstabl": 164, "up": [116, 163, 178], "updat": [161, 164], "us": [148, 159, 161, 166, 172, 175, 177, 178], "usag": 158, "util": [5, 8, 9, 13], "v": 164, "v0": [155, 156, 160, 161], "v1": [156, 161], "valid": 159, "variabl": 4, "vector": [5, 10, 13, 14, 20, 132, 163, 178], "vectorenv": 10, "ventur": 117, "version": [127, 128, 129, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 150, 151, 152, 153, 154], "video": [9, 118, 119, 120, 121, 148], "visual": [9, 174, 175], "visualis": 174, "walk": [151, 152], "walker": 127, "walker2d": 147, "war": 105, "we": 175, "weight": 178, "what": [158, 164], "when": 162, "who": 161, "why": [158, 161, 162], "wizard": 122, "wor": 122, "word": 123, "world": 159, "wrapper": [14, 15, 16, 17, 18, 19, 20, 159, 161, 166, 168], "write": 1, "yar": 124, "you": [159, 174], "your": [158, 159, 161, 162, 164, 166, 170], "yourself": 178, "youtub": 172, "zapper": 123, "zaxxon": 125, "zone": 34}}) \ No newline at end of file +Search.setIndex({"alltitles": {"0.12.5": [[155, "release-0-12-5"]], "0.19.0": [[155, "release-0-19-0"]], "0.22.0": [[155, "release-0-22-0"]], "0.23.0": [[155, "release-0-23-0"]], "0.23.1": [[155, "release-0-23-1"]], "0.24.0": [[155, "release-0-24-0"]], "0.24.1": [[155, "release-0-24-1"]], "0.25.0": [[155, "release-0-25-0"]], "0.25.1": [[155, "release-0-25-1"]], "0.25.2": [[155, "release-0-25-2"]], "0.26.0": [[155, "release-0-26-0"]], "0.26.1": [[155, "release-0-26-1"]], "0.26.2": [[155, "release-0-26-2"]], "1. Package Name Change": [[160, "package-name-change"]], "2. Seeding and Random Number Generation": [[160, "seeding-and-random-number-generation"]], "3. Environment Reset Changes": [[160, "environment-reset-changes"]], "4. Step Function: The done \u2192 terminated/truncated Split": [[160, "step-function-the-done-terminated-truncated-split"]], "404 - Page Not Found": [[0, null]], "5. Render Mode Changes": [[160, "render-mode-changes"]], "About the Environment: Blackjack": [[163, "about-the-environment-blackjack"]], "Acrobot": [[131, null]], "Action Masking in the Taxi Environment": [[173, null]], "Action Space": [[127, "action-space"], [128, "action-space"], [129, "action-space"], [131, "action-space"], [132, "action-space"], [133, "action-space"], [134, "action-space"], [135, "action-space"], [137, "action-space"], [138, "action-space"], [139, "action-space"], [140, "action-space"], [141, "action-space"], [142, "action-space"], [143, "action-space"], [144, "action-space"], [145, "action-space"], [146, "action-space"], [147, "action-space"], [150, "action-space"], [151, "action-space"], [152, "action-space"], [153, "action-space"], [154, "action-space"]], "Action Space Issues": [[159, "action-space-issues"]], "Action Wrappers": [[16, null]], "Action and observation spaces": [[158, "action-and-observation-spaces"]], "Adding Rendering": [[159, "adding-rendering"]], "Adding a new environment": [[1, "adding-a-new-environment"]], "Additional Methods": [[10, "additional-methods"], [11, "additional-methods"], [12, "additional-methods"]], "Additional functions": [[4, "additional-functions"]], "Advanced Environment Features": [[159, "advanced-environment-features"]], "Advantage Actor-Critic (A2C)": [[178, "advantage-actor-critic-a2c"]], "Adventure": [[22, null]], "AgileRL": [[171, "agilerl"]], "Air Raid": [[23, null]], "Algorithmic heuristics": [[162, "algorithmic-heuristics"]], "Alien": [[24, null]], "Alternative solutions": [[165, "alternative-solutions"]], "Amidar": [[25, null]], "Analyzing Training Results": [[163, "analyzing-training-results"]], "Ant": [[137, null]], "Arguments": [[127, "arguments"], [128, "arguments"], [129, "arguments"], [131, "arguments"], [132, "arguments"], [133, "arguments"], [134, "arguments"], [135, "arguments"], [137, "arguments"], [138, "arguments"], [139, "arguments"], [140, "arguments"], [141, "arguments"], [142, "arguments"], [143, "arguments"], [144, "arguments"], [145, "arguments"], [146, "arguments"], [147, "arguments"], [150, "arguments"], [151, "arguments"], [152, "arguments"], [153, "arguments"], [154, "arguments"]], "Assault": [[26, null]], "Asterix": [[27, null]], "Asteroids": [[28, null]], "AsyncVectorEnv": [[11, null]], "Atari": [[21, null]], "Atlantis": [[29, null]], "Atlantis2": [[30, null]], "Attributes": [[2, "attributes"], [5, "attributes"], [10, "attributes"], [15, "attributes"]], "Autonomous Driving environments": [[148, "autonomous-driving-environments"], [148, "id2"]], "Available Action Wrappers": [[16, "available-action-wrappers"]], "Backgammon": [[31, null]], "Bank Heist": [[32, null]], "Base Class": [[16, "base-class"]], "Basic Math": [[33, null]], "Basic Usage": [[158, null]], "Battle Zone": [[34, null]], "Beam Rider": [[35, null]], "Before You Code: Environment Design": [[159, "before-you-code-environment-design"]], "Berzerk": [[36, null]], "Best Practices Summary": [[161, "best-practices-summary"]], "Biological / Medical environments": [[148, "biological-medical-environments"]], "Bipedal Walker": [[127, null]], "Blackjack": [[37, null], [150, null]], "Boundary Handling Errors": [[159, "boundary-handling-errors"]], "Bowling": [[38, null]], "Box2D": [[126, null]], "Boxing": [[39, null]], "Breakout": [[40, null]], "Build the Documentation": [[1, "build-the-documentation"]], "Building a Q-Learning Agent": [[163, "building-a-q-learning-agent"]], "Building an agent": [[174, "building-an-agent"], [177, "building-an-agent"]], "Car Racing": [[128, null]], "Carnival": [[41, null]], "Cart Pole": [[132, null]], "Casino": [[42, null]], "Centipede": [[43, null]], "Check Environment Validity": [[159, "check-environment-validity"]], "Chopper Command": [[44, null]], "Classic Control": [[130, null]], "Cliff Walking": [[151, null]], "Cliff Walking Slippery": [[152, null]], "Close": [[165, "close"]], "Common Debug Issues": [[159, "common-debug-issues"]], "Common Environment Design Pitfalls": [[159, "common-environment-design-pitfalls"]], "Common Issues for Beginners": [[158, "common-issues-for-beginners"]], "Common Training Issues and Solutions": [[163, "common-training-issues-and-solutions"]], "Common Wrappers": [[17, "common-wrappers"]], "Comparing training performance across versions": [[136, "comparing-training-performance-across-versions"]], "Compatibility Helpers": [[160, "compatibility-helpers"]], "Composite Spaces": [[5, "composite-spaces"], [6, null]], "Constructing Observations": [[159, "constructing-observations"]], "Constructing Observations From Environment States": [[165, "constructing-observations-from-environment-states"]], "Converting Jax-based Functional environments to standard Env": [[3, "converting-jax-based-functional-environments-to-standard-env"]], "Core variables": [[4, "core-variables"]], "Crazy Climber": [[45, null]], "Create a Custom Environment": [[159, null]], "Creating Environment Instances": [[165, "creating-environment-instances"]], "Creating a Package": [[165, "creating-a-package"]], "Creating environments": [[2, "creating-environments"]], "Creating the Q-table": [[175, "creating-the-q-table"]], "Credits": [[127, "credits"], [128, "credits"], [129, "credits"]], "Crossbow": [[46, null]], "Darkchambers": [[47, null]], "Data Conversion Wrappers": [[17, "data-conversion-wrappers"]], "Debugging Your Environment": [[159, "debugging-your-environment"]], "Declaration and Initialization": [[165, "declaration-and-initialization"]], "Defender": [[48, null]], "Demon Attack": [[49, null]], "Description": [[127, "description"], [128, "description"], [129, "description"], [131, "description"], [132, "description"], [133, "description"], [134, "description"], [135, "description"], [137, "description"], [138, "description"], [139, "description"], [140, "description"], [141, "description"], [142, "description"], [143, "description"], [144, "description"], [145, "description"], [146, "description"], [147, "description"], [150, "description"], [151, "description"], [152, "description"], [153, "description"], [154, "description"]], "Design for Learning": [[159, "design-for-learning"]], "Domain Randomization": [[178, "domain-randomization"]], "Donkey Kong": [[50, null]], "Double Dunk": [[51, null]], "Earthworld": [[52, null]], "Economic / Financial environments": [[148, "economic-financial-environments"]], "Editing an environment page": [[1, "editing-an-environment-page"]], "Electrical / Energy environments": [[148, "electrical-energy-environments"]], "Elevator Action": [[53, null]], "Enduro": [[54, null]], "Entombed": [[55, null]], "Env": [[2, null]], "Environment Checking": [[9, "environment-checking"]], "Environment __init__": [[159, "environment-init"]], "Environment pickling": [[9, "environment-pickling"]], "Environment-Specific Changes": [[160, "environment-specific-changes"]], "Epilogue": [[169, "epilogue"]], "Episode End": [[131, "episode-end"], [132, "episode-end"], [133, "episode-end"], [134, "episode-end"], [137, "episode-end"], [138, "episode-end"], [139, "episode-end"], [140, "episode-end"], [141, "episode-end"], [142, "episode-end"], [143, "episode-end"], [144, "episode-end"], [145, "episode-end"], [146, "episode-end"], [147, "episode-end"], [150, "episode-end"], [151, "episode-end"], [152, "episode-end"], [153, "episode-end"], [154, "episode-end"]], "Episode Termination": [[127, "episode-termination"], [128, "episode-termination"], [129, "episode-termination"]], "Episode Truncation": [[135, "episode-truncation"]], "Et": [[56, null]], "Exact reproducibility": [[136, "exact-reproducibility"]], "Executing an action": [[163, "executing-an-action"], [174, "executing-an-action"]], "Explaining the Code Step by Step": [[158, "explaining-the-code-step-by-step"]], "Exploration vs Exploitation": [[163, "exploration-vs-exploitation"]], "External Environments": [[148, null]], "First-Party Environments": [[148, "first-party-environments"]], "Fishing Derby": [[57, null]], "Flag Capture": [[58, null]], "Freeway": [[59, null]], "Frogger": [[60, null]], "Frostbite": [[61, null]], "Frozen Lake": [[153, null]], "Functional Env": [[3, null]], "Fundamental Spaces": [[5, "fundamental-spaces"], [7, null]], "Galaxian": [[62, null]], "Game environments": [[148, "game-environments"]], "Generate your environment": [[165, "generate-your-environment"]], "Getting Help": [[160, "getting-help"]], "Gopher": [[63, null]], "Gravitar": [[64, null]], "GridWorld Example Design": [[159, "gridworld-example-design"]], "Gym Migration Guide": [[160, null]], "Gym Release Notes": [[155, null]], "Gymnasium Basics": [[164, null], [168, null], [170, "gymnasium-basics"]], "Gymnasium Release Notes": [[156, null]], "Gymnasium v1.1.1": [[156, "release-v1-1-1"]], "Gymnasium-docs": [[1, null]], "Gymnasium.vector.VectorEnv": [[10, "gymnasium-vector-vectorenv"]], "Half Cheetah": [[138, null]], "Handling Time Limits": [[166, null]], "Hangman": [[65, null]], "Haunted House": [[66, null]], "Hero": [[67, null]], "Hopper": [[139, null]], "How Action Masking Works": [[173, "how-action-masking-works"]], "Human Cannonball": [[68, null]], "Humanoid": [[140, null]], "Humanoid Standup": [[141, null]], "Ice Hockey": [[69, null]], "Implemented Action wrappers": [[14, "implemented-action-wrappers"]], "Implemented Data Conversion wrappers": [[14, "implemented-data-conversion-wrappers"]], "Implemented Observation wrappers": [[14, "implemented-observation-wrappers"]], "Implemented Reward wrappers": [[14, "implemented-reward-wrappers"]], "Implemented Wrappers": [[18, "implemented-wrappers"], [19, "implemented-wrappers"]], "Implementing Custom Wrappers": [[167, null]], "Implementing environments": [[2, "implementing-environments"]], "Importance in learning code": [[166, "importance-in-learning-code"]], "Imports and Environment Setup": [[174, "imports-and-environment-setup"]], "Information": [[150, "information"], [151, "information"], [152, "information"], [153, "information"], [154, "information"]], "Inheriting from gymnasium.ActionWrapper": [[167, "inheriting-from-gymnasium-actionwrapper"]], "Inheriting from gymnasium.ObservationWrapper": [[167, "inheriting-from-gymnasium-observationwrapper"]], "Inheriting from gymnasium.RewardWrapper": [[167, "inheriting-from-gymnasium-rewardwrapper"]], "Inheriting from gymnasium.Wrapper": [[167, "inheriting-from-gymnasium-wrapper"]], "Initializing Environments": [[158, "initializing-environments"]], "Instructions for modifying environment pages": [[1, "instructions-for-modifying-environment-pages"]], "Integration with Experiment Tracking": [[161, "integration-with-experiment-tracking"]], "Interpreting the Results": [[163, "interpreting-the-results"]], "Introduction": [[178, "introduction"]], "Inverted Double Pendulum": [[142, null]], "Inverted Pendulum": [[143, null]], "Jamesbond": [[70, null]], "Johnny Code from Youtube": [[171, "johnny-code-from-youtube"]], "Journey Escape": [[71, null]], "Kaboom": [[72, null]], "Kangaroo": [[73, null]], "Key Changes Breakdown": [[160, "key-changes-breakdown"]], "Key Design Questions": [[159, "key-design-questions"]], "Keystone Kapers": [[74, null]], "King Kong": [[75, null]], "Klax": [[76, null]], "Koolaid": [[77, null]], "Krull": [[78, null]], "Kung Fu Master": [[79, null]], "Laser Gates": [[80, null]], "List of Wrappers": [[20, null]], "Load custom quadruped robot environments": [[169, null]], "Loading OpenAI Gym environments": [[160, "loading-openai-gym-environments"]], "Lost Luggage": [[81, null]], "Lunar Lander": [[129, null]], "Make and register": [[4, null]], "Make your own custom environment": [[165, null]], "Making Vector Environments": [[10, "making-vector-environments"]], "Manual Testing with Known Actions": [[159, "manual-testing-with-known-actions"]], "Map size: 11 \\times 11": [[175, "map-size-11-times-11"]], "Map size: 4 \\times 4": [[175, "map-size-4-times-4"]], "Map size: 7 \\times 7": [[175, "map-size-7-times-7"]], "Map size: 9 \\times 9": [[175, "map-size-9-times-9"]], "Mario Bros": [[82, null]], "Mathematics / Computational": [[148, "mathematics-computational"]], "Methods": [[2, "methods"], [5, "methods"], [10, "methods"], [15, "methods"]], "Miniature Golf": [[83, null]], "Misc Wrappers": [[17, null]], "Miscellaneous": [[13, "miscellaneous"]], "Modifying the environment": [[158, "modifying-the-environment"]], "Montezuma Revenge": [[84, null]], "More Information": [[161, "more-information"]], "Mountain Car": [[133, null]], "Mountain Car Continuous": [[134, null]], "Mr Do": [[85, null]], "Ms Pacman": [[86, null]], "MuJoCo": [[136, null]], "Name This Game": [[87, null]], "New v0.26+ Code (Including v1.0.0)": [[160, "new-v0-26-code-including-v1-0-0"]], "Next Steps": [[158, "next-steps"], [159, "next-steps"], [163, "next-steps"]], "Notes": [[129, "notes"], [146, "notes"]], "Notice": [[178, "notice"]], "Observation Space": [[127, "observation-space"], [128, "observation-space"], [129, "observation-space"], [131, "observation-space"], [132, "observation-space"], [133, "observation-space"], [134, "observation-space"], [135, "observation-space"], [137, "observation-space"], [138, "observation-space"], [139, "observation-space"], [140, "observation-space"], [141, "observation-space"], [142, "observation-space"], [143, "observation-space"], [144, "observation-space"], [145, "observation-space"], [146, "observation-space"], [147, "observation-space"], [150, "observation-space"], [151, "observation-space"], [152, "observation-space"], [153, "observation-space"], [154, "observation-space"]], "Observation Wrappers": [[18, null]], "Observing the environment": [[174, "observing-the-environment"]], "Old to New Step API Compatibility": [[9, "old-to-new-step-api-compatibility"]], "Old v0.21 Code": [[160, "old-v0-21-code"]], "Optimizing training": [[162, "optimizing-training"]], "Othello": [[88, null]], "Other": [[148, "other"]], "Other environments": [[148, "other-environments"]], "Other steps": [[1, "other-steps"]], "Pacman": [[89, null]], "Parameterized Environments": [[159, "parameterized-environments"]], "Parameters we\u2019ll use": [[175, "parameters-we-ll-use"]], "Pendulum": [[135, null]], "Performance Analysis of Synchronous and Asynchronous Vectorized Environments": [[178, "performance-analysis-of-synchronous-and-asynchronous-vectorized-environments"]], "Phoenix": [[90, null]], "Pitfall": [[91, null]], "Pitfall2": [[92, null]], "Plot learning curve": [[177, "plot-learning-curve"]], "Plotting": [[178, "plotting"]], "Policy Network": [[177, "policy-network"]], "Pong": [[93, null]], "Pooyan": [[94, null]], "Private Eye": [[95, null]], "Pusher": [[144, null]], "Qbert": [[96, null]], "Quick Reference: Complete Changes Table": [[160, "quick-reference-complete-changes-table"]], "Reacher": [[145, null]], "Real-World Environment Design Tips": [[159, "real-world-environment-design-tips"]], "Recommended solution": [[165, "recommended-solution"]], "Recording Agents": [[161, null]], "Recording During Training (Periodic)": [[161, "recording-during-training-periodic"]], "Recording Every Episode (Evaluation)": [[161, "recording-every-episode-evaluation"]], "References": [[128, "references"], [131, "references"], [150, "references"], [151, "references"], [152, "references"], [154, "references"], [175, "references"], [177, "references"], [178, "references"]], "Registering Envs": [[165, "registering-envs"]], "Registering and making the environment": [[159, "registering-and-making-the-environment"]], "Removed Environments": [[160, "removed-environments"]], "Rendering": [[165, "rendering"]], "Rendering Arguments": [[136, "rendering-arguments"]], "Rendering Backend": [[136, "rendering-backend"]], "Reset": [[165, "reset"]], "Reset Arguments": [[128, "reset-arguments"]], "Reset function": [[159, "reset-function"]], "Results Analysis": [[173, "results-analysis"]], "Reward": [[134, "reward"], [151, "reward"], [152, "reward"]], "Reward Design Issues": [[159, "reward-design-issues"]], "Reward Wrappers": [[19, null]], "Reward:": [[133, "reward"]], "Rewards": [[127, "rewards"], [128, "rewards"], [129, "rewards"], [131, "rewards"], [132, "rewards"], [135, "rewards"], [137, "rewards"], [138, "rewards"], [139, "rewards"], [140, "rewards"], [141, "rewards"], [142, "rewards"], [143, "rewards"], [144, "rewards"], [145, "rewards"], [146, "rewards"], [147, "rewards"], [150, "rewards"], [153, "rewards"], [154, "rewards"]], "Riverraid": [[97, null]], "Road Runner": [[98, null]], "Robotank": [[99, null]], "Robotics environments": [[148, "robotics-environments"], [148, "id1"]], "Running the Experiment": [[173, "running-the-experiment"]], "Running the environment": [[175, "running-the-environment"]], "Runtime Performance benchmark": [[9, "runtime-performance-benchmark"]], "Save Rendering Videos": [[9, "save-rendering-videos"]], "Saving/ Loading Weights": [[178, "saving-loading-weights"]], "Seaquest": [[100, null]], "Seeding": [[9, "seeding"]], "Setup": [[165, "setup"], [169, "setup"], [178, "setup"]], "Shared Memory for a Space": [[13, "shared-memory-for-a-space"]], "Showcase the Agent": [[178, "showcase-the-agent"]], "Side-by-Side Code Comparison": [[160, "side-by-side-code-comparison"]], "Sir Lancelot": [[101, null]], "Skiing": [[102, null]], "Solaris": [[103, null]], "Solution": [[166, "solution"]], "Solving Blackjack with Tabular Q-Learning": [[174, null]], "Solving Frozenlake with Tabular Q-Learning": [[175, null]], "Space Invaders": [[104, null]], "Space War": [[105, null]], "Spaces": [[5, null]], "Spaces Utils": [[8, null]], "Speeding Up Training": [[162, null]], "Speeding up A2C Training with Vector Envs": [[178, null]], "Star Gunner": [[106, null]], "Start Simple, Add Complexity Gradually": [[159, "start-simple-add-complexity-gradually"]], "Starting State": [[127, "starting-state"], [128, "starting-state"], [129, "starting-state"], [131, "starting-state"], [132, "starting-state"], [133, "starting-state"], [134, "starting-state"], [135, "starting-state"], [137, "starting-state"], [138, "starting-state"], [139, "starting-state"], [140, "starting-state"], [141, "starting-state"], [142, "starting-state"], [143, "starting-state"], [144, "starting-state"], [145, "starting-state"], [146, "starting-state"], [147, "starting-state"], [150, "starting-state"], [151, "starting-state"], [152, "starting-state"], [153, "starting-state"], [154, "starting-state"]], "State Representation Problems": [[159, "state-representation-problems"]], "Step": [[165, "step"]], "Step 0.1 - Download a Robot Model": [[169, "step-0-1-download-a-robot-model"]], "Step 1 - Load the model": [[169, "step-1-load-the-model"]], "Step 2 - Tweaking the Environment Parameters": [[169, "step-2-tweaking-the-environment-parameters"]], "Step 2.1 - Tweaking the Environment Simulation Parameters": [[169, "step-2-1-tweaking-the-environment-simulation-parameters"]], "Step 2.2 - Tweaking the Environment Termination Parameters": [[169, "step-2-2-tweaking-the-environment-termination-parameters"]], "Step 2.3 - Tweaking the Environment Reward Parameters": [[169, "step-2-3-tweaking-the-environment-reward-parameters"]], "Step 2.4 - Tweaking the Environment Observation Parameters": [[169, "step-2-4-tweaking-the-environment-observation-parameters"]], "Step 3 - Train your Agent": [[169, "step-3-train-your-agent"]], "Step API Compatibility": [[160, "step-api-compatibility"]], "Step function": [[159, "step-function"]], "Subclassing gymnasium.Env": [[165, "subclassing-gymnasium-env"]], "Superman": [[107, null]], "Surround": [[108, null]], "Swimmer": [[146, null]], "SyncVectorEnv": [[12, null]], "Taxi": [[154, null]], "Telecommunication Systems environments": [[148, "telecommunication-systems-environments"]], "Tennis": [[109, null]], "Termination": [[137, "termination"], [138, "termination"], [139, "termination"], [140, "termination"], [141, "termination"], [142, "termination"], [143, "termination"], [144, "termination"], [145, "termination"], [146, "termination"], [147, "termination"], [166, "termination"]], "Testing Your Migration": [[160, "testing-your-migration"]], "Testing Your Trained Agent": [[163, "testing-your-trained-agent"]], "Tetris": [[110, null]], "The FrozenLake environment": [[175, "the-frozenlake-environment"]], "The Learning Process": [[163, "the-learning-process"]], "The Training Loop": [[163, "the-training-loop"]], "The requested page could not be found.": [[0, "the-requested-page-could-not-be-found"]], "Think About Your Research Question": [[159, "think-about-your-research-question"]], "Think you can do better?": [[174, "think-you-can-do-better"]], "Third-Party Environments using Gym": [[148, "third-party-environments-using-gym"]], "Third-Party Tutorials": [[171, null]], "Third-Party tutorials about gymnasium": [[171, "third-party-tutorials-about-gymnasium"]], "Third-Party tutorials about libraries that use gymnasium": [[171, "third-party-tutorials-about-libraries-that-use-gymnasium"]], "Third-party environments with Gymnasium": [[148, "third-party-environments-with-gymnasium"]], "Tic Tac Toe 3D": [[111, null]], "Time Pilot": [[112, null]], "TimeLimit Wrapper Changes": [[160, "timelimit-wrapper-changes"]], "Toy Text": [[149, null]], "Training Agents": [[170, "training-agents"], [172, null], [176, null]], "Training Recording Benefits": [[161, "training-recording-benefits"]], "Training an Agent": [[163, null]], "Training the A2C Agent": [[178, "training-the-a2c-agent"]], "Training the Agent": [[163, "training-the-agent"]], "Training using REINFORCE for Mujoco": [[177, null]], "Transition Dynamics:": [[133, "transition-dynamics"], [134, "transition-dynamics"]], "Trondead": [[113, null]], "Truncation": [[137, "truncation"], [138, "truncation"], [139, "truncation"], [140, "truncation"], [141, "truncation"], [142, "truncation"], [143, "truncation"], [144, "truncation"], [145, "truncation"], [146, "truncation"], [147, "truncation"], [166, "truncation"]], "Try playing the environment yourself": [[178, "try-playing-the-environment-yourself"]], "Turmoil": [[114, null]], "Tutankham": [[115, null]], "Tutorials": [[170, null]], "Uncommon Wrappers": [[17, "uncommon-wrappers"]], "Understanding Q-Learning Intuitively": [[163, "understanding-q-learning-intuitively"]], "Understanding the Agent-Environment Loop": [[158, "understanding-the-agent-environment-loop"]], "Understanding the Output": [[161, "understanding-the-output"]], "Understanding the Q-Learning Update": [[163, "understanding-the-q-learning-update"]], "Understanding the Taxi Environment": [[173, "understanding-the-taxi-environment"]], "Up N Down": [[116, null]], "Using Vectorized Environments": [[178, "using-vectorized-environments"]], "Using Wrappers": [[159, "using-wrappers"], [165, "using-wrappers"]], "Utility functions": [[5, "utility-functions"], [9, null], [13, null]], "Vector Only wrappers": [[14, "vector-only-wrappers"]], "Vector Utility functions": [[5, "vector-utility-functions"]], "Vector only Wrappers": [[20, "vector-only-wrappers"]], "Vectorize": [[10, null]], "Vectorized Common wrappers": [[14, "vectorized-common-wrappers"]], "Vectorized environment": [[132, "vectorized-environment"]], "Vectorized environments": [[162, "vectorized-environments"]], "Vectorizing Spaces": [[13, "vectorizing-spaces"]], "Venture": [[117, null]], "Version History": [[127, "version-history"], [128, "version-history"], [129, "version-history"], [131, "version-history"], [132, "version-history"], [133, "version-history"], [134, "version-history"], [135, "version-history"], [137, "version-history"], [138, "version-history"], [139, "version-history"], [140, "version-history"], [141, "version-history"], [142, "version-history"], [143, "version-history"], [144, "version-history"], [145, "version-history"], [146, "version-history"], [147, "version-history"], [150, "version-history"], [151, "version-history"], [152, "version-history"], [153, "version-history"], [154, "version-history"]], "Versions": [[136, "versions"]], "Video Checkers": [[118, null]], "Video Chess": [[119, null]], "Video Cube": [[120, null]], "Video Game environments": [[148, "video-game-environments"]], "Video Pinball": [[121, null]], "Visualising the policy": [[174, "visualising-the-policy"]], "Visualization": [[9, "visualization"], [175, "visualization"]], "Visualizing Results": [[173, "visualizing-results"]], "Visualizing the training": [[174, "visualizing-the-training"]], "Walker2D": [[147, null]], "What is Reinforcement Learning?": [[158, "what-is-reinforcement-learning"]], "What to Expect During Training": [[163, "what-to-expect-during-training"]], "When to Record": [[161, "when-to-record"]], "Who Should Read This Guide?": [[160, "who-should-read-this-guide"]], "Why Did the API Change?": [[160, "why-did-the-api-change"]], "Why Gymnasium?": [[158, "why-gymnasium"]], "Why Record Your Agent?": [[161, "why-record-your-agent"]], "Wizard Of Wor": [[122, null]], "Word Zapper": [[123, null]], "Wrappers": [[14, null], [15, null]], "Writing Tutorials": [[1, "writing-tutorials"]], "Yars Revenge": [[124, null]], "Your First RL Program": [[158, "your-first-rl-program"]], "Zaxxon": [[125, null]], "freeCodeCamp from Youtube": [[171, "freecodecamp-from-youtube"]], "v0.20.0": [[155, "release-v0-20-0"]], "v0.21.0": [[155, "release-v0-21-0"]], "v0.26.0: Initial Release": [[156, "release-v0-26-0"]], "v0.26.1": [[156, "release-v0-26-1"]], "v0.26.2 ": [[156, "release-v0-26-2"]], "v0.26.3": [[156, "release-v0-26-3"]], "v0.27.0": [[156, "release-v0-27-0"]], "v0.27.1": [[156, "release-v0-27-1"]], "v0.28.0": [[156, "release-v0-28-0"]], "v0.28.1": [[156, "release-v0-28-1"]], "v0.29.0": [[156, "release-v0-29-0"]], "v0.29.1 ": [[156, "release-v0-29-1"]], "v0.7.3": [[155, "release-v0-7-3"]], "v0.7.4": [[155, "release-v0-7-4"]], "v0.9.5": [[155, "release-v0-9-5"]], "v0.9.6": [[155, "release-v0-9-6"]], "v1.0.0": [[156, "release-v1-0-0"]], "v1.0.0a1: v1.0.0 alpha1 ": [[156, "release-v1-0-0a1"]], "v1.0.0a2: v1.0.0 alpha 2": [[156, "release-v1-0-0a2"]], "v1.1.0": [[156, "release-v1-1-0"]], "v1.2.0": [[156, "release-v1-2-0"]], "\ud83d\udea8 Agent Gets Stuck in Poor Strategy": [[163, "agent-gets-stuck-in-poor-strategy"]], "\ud83d\udea8 Agent Never Improves": [[163, "agent-never-improves"]], "\ud83d\udea8 Learning Too Slow": [[163, "learning-too-slow"]], "\ud83d\udea8 Unstable Training": [[163, "unstable-training"]]}, "docnames": ["404", "README", "api/env", "api/functional", "api/registry", "api/spaces", "api/spaces/composite", "api/spaces/fundamental", "api/spaces/utils", "api/utils", "api/vector", "api/vector/async_vector_env", "api/vector/sync_vector_env", "api/vector/utils", "api/vector/wrappers", "api/wrappers", "api/wrappers/action_wrappers", "api/wrappers/misc_wrappers", "api/wrappers/observation_wrappers", "api/wrappers/reward_wrappers", "api/wrappers/table", "environments/atari", "environments/atari/adventure", "environments/atari/air_raid", "environments/atari/alien", "environments/atari/amidar", "environments/atari/assault", "environments/atari/asterix", "environments/atari/asteroids", "environments/atari/atlantis", "environments/atari/atlantis2", "environments/atari/backgammon", "environments/atari/bank_heist", "environments/atari/basic_math", "environments/atari/battle_zone", "environments/atari/beam_rider", "environments/atari/berzerk", "environments/atari/blackjack", "environments/atari/bowling", "environments/atari/boxing", "environments/atari/breakout", "environments/atari/carnival", "environments/atari/casino", "environments/atari/centipede", "environments/atari/chopper_command", "environments/atari/crazy_climber", "environments/atari/crossbow", "environments/atari/darkchambers", "environments/atari/defender", "environments/atari/demon_attack", "environments/atari/donkey_kong", "environments/atari/double_dunk", "environments/atari/earthworld", "environments/atari/elevator_action", "environments/atari/enduro", "environments/atari/entombed", "environments/atari/et", "environments/atari/fishing_derby", "environments/atari/flag_capture", "environments/atari/freeway", "environments/atari/frogger", "environments/atari/frostbite", "environments/atari/galaxian", "environments/atari/gopher", "environments/atari/gravitar", "environments/atari/hangman", "environments/atari/haunted_house", "environments/atari/hero", "environments/atari/human_cannonball", "environments/atari/ice_hockey", "environments/atari/jamesbond", "environments/atari/journey_escape", "environments/atari/kaboom", "environments/atari/kangaroo", "environments/atari/keystone_kapers", "environments/atari/king_kong", "environments/atari/klax", "environments/atari/koolaid", "environments/atari/krull", "environments/atari/kung_fu_master", "environments/atari/laser_gates", "environments/atari/lost_luggage", "environments/atari/mario_bros", "environments/atari/miniature_golf", "environments/atari/montezuma_revenge", "environments/atari/mr_do", "environments/atari/ms_pacman", "environments/atari/name_this_game", "environments/atari/othello", "environments/atari/pacman", "environments/atari/phoenix", "environments/atari/pitfall", "environments/atari/pitfall2", "environments/atari/pong", "environments/atari/pooyan", "environments/atari/private_eye", "environments/atari/qbert", "environments/atari/riverraid", "environments/atari/road_runner", "environments/atari/robotank", "environments/atari/seaquest", "environments/atari/sir_lancelot", "environments/atari/skiing", "environments/atari/solaris", "environments/atari/space_invaders", "environments/atari/space_war", "environments/atari/star_gunner", "environments/atari/superman", "environments/atari/surround", "environments/atari/tennis", "environments/atari/tetris", "environments/atari/tic_tac_toe_3d", "environments/atari/time_pilot", "environments/atari/trondead", "environments/atari/turmoil", "environments/atari/tutankham", "environments/atari/up_n_down", "environments/atari/venture", "environments/atari/video_checkers", "environments/atari/video_chess", "environments/atari/video_cube", "environments/atari/video_pinball", "environments/atari/wizard_of_wor", "environments/atari/word_zapper", "environments/atari/yars_revenge", "environments/atari/zaxxon", "environments/box2d", "environments/box2d/bipedal_walker", "environments/box2d/car_racing", "environments/box2d/lunar_lander", "environments/classic_control", "environments/classic_control/acrobot", "environments/classic_control/cart_pole", "environments/classic_control/mountain_car", "environments/classic_control/mountain_car_continuous", "environments/classic_control/pendulum", "environments/mujoco", "environments/mujoco/ant", "environments/mujoco/half_cheetah", "environments/mujoco/hopper", "environments/mujoco/humanoid", "environments/mujoco/humanoid_standup", "environments/mujoco/inverted_double_pendulum", "environments/mujoco/inverted_pendulum", "environments/mujoco/pusher", "environments/mujoco/reacher", "environments/mujoco/swimmer", "environments/mujoco/walker2d", "environments/third_party_environments", "environments/toy_text", "environments/toy_text/blackjack", "environments/toy_text/cliff_walking", "environments/toy_text/cliff_walking_slippery", "environments/toy_text/frozen_lake", "environments/toy_text/taxi", "gym_release_notes/index", "gymnasium_release_notes/index", "index", "introduction/basic_usage", "introduction/create_custom_env", "introduction/migration_guide", "introduction/record_agent", "introduction/speed_up_env", "introduction/train_agent", "tutorials/gymnasium_basics/README", "tutorials/gymnasium_basics/environment_creation", "tutorials/gymnasium_basics/handling_time_limits", "tutorials/gymnasium_basics/implementing_custom_wrappers", "tutorials/gymnasium_basics/index", "tutorials/gymnasium_basics/load_quadruped_model", "tutorials/index", "tutorials/third-party-tutorials", "tutorials/training_agents/README", "tutorials/training_agents/action_masking_taxi", "tutorials/training_agents/blackjack_q_learning", "tutorials/training_agents/frozenlake_q_learning", "tutorials/training_agents/index", "tutorials/training_agents/mujoco_reinforce", "tutorials/training_agents/vector_a2c"], "envversion": {"sphinx": 62, "sphinx.domains.c": 3, "sphinx.domains.changeset": 1, "sphinx.domains.citation": 1, "sphinx.domains.cpp": 9, "sphinx.domains.index": 1, "sphinx.domains.javascript": 3, "sphinx.domains.math": 2, "sphinx.domains.python": 4, "sphinx.domains.rst": 2, "sphinx.domains.std": 2, "sphinx.ext.viewcode": 1}, "filenames": ["404.md", "README.md", "api/env.md", "api/functional.md", "api/registry.md", "api/spaces.md", "api/spaces/composite.md", "api/spaces/fundamental.md", "api/spaces/utils.md", "api/utils.md", "api/vector.md", "api/vector/async_vector_env.md", "api/vector/sync_vector_env.md", "api/vector/utils.md", "api/vector/wrappers.md", "api/wrappers.md", "api/wrappers/action_wrappers.md", "api/wrappers/misc_wrappers.md", "api/wrappers/observation_wrappers.md", "api/wrappers/reward_wrappers.md", "api/wrappers/table.md", "environments/atari.md", "environments/atari/adventure.md", "environments/atari/air_raid.md", "environments/atari/alien.md", "environments/atari/amidar.md", "environments/atari/assault.md", "environments/atari/asterix.md", "environments/atari/asteroids.md", "environments/atari/atlantis.md", "environments/atari/atlantis2.md", "environments/atari/backgammon.md", "environments/atari/bank_heist.md", "environments/atari/basic_math.md", "environments/atari/battle_zone.md", "environments/atari/beam_rider.md", "environments/atari/berzerk.md", "environments/atari/blackjack.md", "environments/atari/bowling.md", "environments/atari/boxing.md", "environments/atari/breakout.md", "environments/atari/carnival.md", "environments/atari/casino.md", "environments/atari/centipede.md", "environments/atari/chopper_command.md", "environments/atari/crazy_climber.md", "environments/atari/crossbow.md", "environments/atari/darkchambers.md", "environments/atari/defender.md", "environments/atari/demon_attack.md", "environments/atari/donkey_kong.md", "environments/atari/double_dunk.md", "environments/atari/earthworld.md", "environments/atari/elevator_action.md", "environments/atari/enduro.md", "environments/atari/entombed.md", "environments/atari/et.md", "environments/atari/fishing_derby.md", "environments/atari/flag_capture.md", "environments/atari/freeway.md", "environments/atari/frogger.md", "environments/atari/frostbite.md", "environments/atari/galaxian.md", "environments/atari/gopher.md", "environments/atari/gravitar.md", "environments/atari/hangman.md", "environments/atari/haunted_house.md", "environments/atari/hero.md", "environments/atari/human_cannonball.md", "environments/atari/ice_hockey.md", "environments/atari/jamesbond.md", "environments/atari/journey_escape.md", "environments/atari/kaboom.md", "environments/atari/kangaroo.md", "environments/atari/keystone_kapers.md", "environments/atari/king_kong.md", "environments/atari/klax.md", "environments/atari/koolaid.md", "environments/atari/krull.md", "environments/atari/kung_fu_master.md", "environments/atari/laser_gates.md", "environments/atari/lost_luggage.md", "environments/atari/mario_bros.md", "environments/atari/miniature_golf.md", "environments/atari/montezuma_revenge.md", "environments/atari/mr_do.md", "environments/atari/ms_pacman.md", "environments/atari/name_this_game.md", "environments/atari/othello.md", "environments/atari/pacman.md", "environments/atari/phoenix.md", "environments/atari/pitfall.md", "environments/atari/pitfall2.md", "environments/atari/pong.md", "environments/atari/pooyan.md", "environments/atari/private_eye.md", "environments/atari/qbert.md", "environments/atari/riverraid.md", "environments/atari/road_runner.md", "environments/atari/robotank.md", "environments/atari/seaquest.md", "environments/atari/sir_lancelot.md", "environments/atari/skiing.md", "environments/atari/solaris.md", "environments/atari/space_invaders.md", "environments/atari/space_war.md", "environments/atari/star_gunner.md", "environments/atari/superman.md", "environments/atari/surround.md", "environments/atari/tennis.md", "environments/atari/tetris.md", "environments/atari/tic_tac_toe_3d.md", "environments/atari/time_pilot.md", "environments/atari/trondead.md", "environments/atari/turmoil.md", "environments/atari/tutankham.md", "environments/atari/up_n_down.md", "environments/atari/venture.md", "environments/atari/video_checkers.md", "environments/atari/video_chess.md", "environments/atari/video_cube.md", "environments/atari/video_pinball.md", "environments/atari/wizard_of_wor.md", "environments/atari/word_zapper.md", "environments/atari/yars_revenge.md", "environments/atari/zaxxon.md", "environments/box2d.md", "environments/box2d/bipedal_walker.md", "environments/box2d/car_racing.md", "environments/box2d/lunar_lander.md", "environments/classic_control.md", "environments/classic_control/acrobot.md", "environments/classic_control/cart_pole.md", "environments/classic_control/mountain_car.md", "environments/classic_control/mountain_car_continuous.md", "environments/classic_control/pendulum.md", "environments/mujoco.md", "environments/mujoco/ant.md", "environments/mujoco/half_cheetah.md", "environments/mujoco/hopper.md", "environments/mujoco/humanoid.md", "environments/mujoco/humanoid_standup.md", "environments/mujoco/inverted_double_pendulum.md", "environments/mujoco/inverted_pendulum.md", "environments/mujoco/pusher.md", "environments/mujoco/reacher.md", "environments/mujoco/swimmer.md", "environments/mujoco/walker2d.md", "environments/third_party_environments.md", "environments/toy_text.md", "environments/toy_text/blackjack.md", "environments/toy_text/cliff_walking.md", "environments/toy_text/cliff_walking_slippery.md", "environments/toy_text/frozen_lake.md", "environments/toy_text/taxi.md", "gym_release_notes/index.md", "gymnasium_release_notes/index.md", "index.md", "introduction/basic_usage.md", "introduction/create_custom_env.md", "introduction/migration_guide.md", "introduction/record_agent.md", "introduction/speed_up_env.md", "introduction/train_agent.md", "tutorials/gymnasium_basics/README.rst", "tutorials/gymnasium_basics/environment_creation.rst", "tutorials/gymnasium_basics/handling_time_limits.rst", "tutorials/gymnasium_basics/implementing_custom_wrappers.rst", "tutorials/gymnasium_basics/index.rst", "tutorials/gymnasium_basics/load_quadruped_model.rst", "tutorials/index.rst", "tutorials/third-party-tutorials.md", "tutorials/training_agents/README.rst", "tutorials/training_agents/action_masking_taxi.rst", "tutorials/training_agents/blackjack_q_learning.rst", "tutorials/training_agents/frozenlake_q_learning.rst", "tutorials/training_agents/index.rst", "tutorials/training_agents/mujoco_reinforce.rst", "tutorials/training_agents/vector_a2c.rst"], "indexentries": {"action() (gymnasium.actionwrapper method)": [[16, "gymnasium.ActionWrapper.action", false]], "action_space (gymnasium.env attribute)": [[2, "gymnasium.Env.action_space", false]], "action_space (gymnasium.vector.vectorenv attribute)": [[10, "gymnasium.vector.VectorEnv.action_space", false]], "action_space (gymnasium.wrapper property)": [[15, "gymnasium.Wrapper.action_space", false]], "actions() (gymnasium.vector.vectoractionwrapper method)": [[14, "gymnasium.vector.VectorActionWrapper.actions", false]], "actionwrapper (class in gymnasium)": [[16, "gymnasium.ActionWrapper", false]], "addrenderobservation (class in gymnasium.wrappers)": [[18, "gymnasium.wrappers.AddRenderObservation", false]], "arrayconversion (class in gymnasium.wrappers)": [[17, "gymnasium.wrappers.ArrayConversion", false]], "arrayconversion (class in gymnasium.wrappers.vector)": [[14, "gymnasium.wrappers.vector.ArrayConversion", false]], "asyncvectorenv (class in gymnasium.vector)": [[11, "gymnasium.vector.AsyncVectorEnv", false]], "ataripreprocessing (class in gymnasium.wrappers)": [[17, "gymnasium.wrappers.AtariPreprocessing", false]], "autoreset (class in gymnasium.wrappers)": [[17, "gymnasium.wrappers.Autoreset", false]], "batch_space() (in module gymnasium.vector.utils)": [[13, "gymnasium.vector.utils.batch_space", false]], "benchmark_init() (in module gymnasium.utils.performance)": [[9, "gymnasium.utils.performance.benchmark_init", false]], "benchmark_render() (in module gymnasium.utils.performance)": [[9, "gymnasium.utils.performance.benchmark_render", false]], "benchmark_step() (in module gymnasium.utils.performance)": [[9, "gymnasium.utils.performance.benchmark_step", false]], "box (class in gymnasium.spaces)": [[7, "gymnasium.spaces.Box", false]], "call() (gymnasium.vector.asyncvectorenv method)": [[11, "gymnasium.vector.AsyncVectorEnv.call", false]], "call() (gymnasium.vector.syncvectorenv method)": [[12, "gymnasium.vector.SyncVectorEnv.call", false]], "callback() (gymnasium.utils.play.playplot method)": [[9, "gymnasium.utils.play.PlayPlot.callback", false]], "capped_cubic_video_schedule() (in module gymnasium.utils.save_video)": [[9, "gymnasium.utils.save_video.capped_cubic_video_schedule", false]], "check_env() (in module gymnasium.utils.env_checker)": [[9, "gymnasium.utils.env_checker.check_env", false]], "clear_mpi_env_vars() (in module gymnasium.vector.utils)": [[13, "gymnasium.vector.utils.clear_mpi_env_vars", false]], "clipaction (class in gymnasium.wrappers)": [[16, "gymnasium.wrappers.ClipAction", false]], "clipaction (class in gymnasium.wrappers.vector)": [[14, "gymnasium.wrappers.vector.ClipAction", false]], "clipreward (class in gymnasium.wrappers)": [[19, "gymnasium.wrappers.ClipReward", false]], "clipreward (class in gymnasium.wrappers.vector)": [[14, "gymnasium.wrappers.vector.ClipReward", false]], "close() (gymnasium.env method)": [[2, "gymnasium.Env.close", false]], "close() (gymnasium.vector.asyncvectorenv method)": [[11, "gymnasium.vector.AsyncVectorEnv.close", false]], "close() (gymnasium.vector.syncvectorenv method)": [[12, "gymnasium.vector.SyncVectorEnv.close", false]], "close() (gymnasium.vector.vectorenv method)": [[10, "gymnasium.vector.VectorEnv.close", false]], "close() (gymnasium.vector.vectorwrapper method)": [[14, "gymnasium.vector.VectorWrapper.close", false]], "close() (gymnasium.wrapper method)": [[15, "gymnasium.Wrapper.close", false]], "closed (gymnasium.vector.vectorenv attribute)": [[10, "gymnasium.vector.VectorEnv.closed", false]], "cloudpicklewrapper() (in module gymnasium.vector.utils)": [[13, "gymnasium.vector.utils.CloudpickleWrapper", false]], "concatenate() (in module gymnasium.vector.utils)": [[13, "gymnasium.vector.utils.concatenate", false]], "contains() (gymnasium.spaces.space method)": [[5, "gymnasium.spaces.Space.contains", false]], "convert_to_done_step_api() (in module gymnasium.utils.step_api_compatibility)": [[9, "gymnasium.utils.step_api_compatibility.convert_to_done_step_api", false]], "convert_to_terminated_truncated_step_api() (in module gymnasium.utils.step_api_compatibility)": [[9, "gymnasium.utils.step_api_compatibility.convert_to_terminated_truncated_step_api", false]], "create_empty_array() (in module gymnasium.vector.utils)": [[13, "gymnasium.vector.utils.create_empty_array", false]], "create_shared_memory() (in module gymnasium.vector.utils)": [[13, "gymnasium.vector.utils.create_shared_memory", false]], "current_namespace (gymnasium.envs.registration attribute)": [[4, "gymnasium.envs.registration.current_namespace", false]], "delayobservation (class in gymnasium.wrappers)": [[18, "gymnasium.wrappers.DelayObservation", false]], "dict (class in gymnasium.spaces)": [[6, "gymnasium.spaces.Dict", false]], "dictinfotolist (class in gymnasium.wrappers.vector)": [[14, "gymnasium.wrappers.vector.DictInfoToList", false]], "discrete (class in gymnasium.spaces)": [[7, "gymnasium.spaces.Discrete", false]], "dtype (gymnasium.spaces.space property)": [[5, "gymnasium.spaces.Space.dtype", false]], "dtypeobservation (class in gymnasium.wrappers)": [[18, "gymnasium.wrappers.DtypeObservation", false]], "dtypeobservation (class in gymnasium.wrappers.vector)": [[14, "gymnasium.wrappers.vector.DtypeObservation", false]], "env (class in gymnasium)": [[2, "gymnasium.Env", false]], "env (gymnasium.wrapper attribute)": [[15, "gymnasium.Wrapper.env", false]], "envspec (class in gymnasium.envs.registration)": [[4, "gymnasium.envs.registration.EnvSpec", false]], "ezpickle (class in gymnasium.utils.ezpickle)": [[9, "gymnasium.utils.ezpickle.EzPickle", false]], "filterobservation (class in gymnasium.wrappers)": [[18, "gymnasium.wrappers.FilterObservation", false]], "filterobservation (class in gymnasium.wrappers.vector)": [[14, "gymnasium.wrappers.vector.FilterObservation", false]], "find_highest_version() (in module gymnasium.envs.registration)": [[4, "gymnasium.envs.registration.find_highest_version", false]], "flatdim() (in module gymnasium.spaces.utils)": [[8, "gymnasium.spaces.utils.flatdim", false]], "flatten() (in module gymnasium.spaces.utils)": [[8, "gymnasium.spaces.utils.flatten", false]], "flatten_space() (in module gymnasium.spaces.utils)": [[8, "gymnasium.spaces.utils.flatten_space", false]], "flattenobservation (class in gymnasium.wrappers)": [[18, "gymnasium.wrappers.FlattenObservation", false]], "flattenobservation (class in gymnasium.wrappers.vector)": [[14, "gymnasium.wrappers.vector.FlattenObservation", false]], "framestackobservation (class in gymnasium.wrappers)": [[18, "gymnasium.wrappers.FrameStackObservation", false]], "from_jsonable() (gymnasium.spaces.space method)": [[5, "gymnasium.spaces.Space.from_jsonable", false]], "funcenv (class in gymnasium.experimental.functional)": [[3, "gymnasium.experimental.functional.FuncEnv", false]], "functionaljaxenv (class in gymnasium.envs.functional_jax_env)": [[3, "gymnasium.envs.functional_jax_env.FunctionalJaxEnv", false]], "get_attr() (gymnasium.vector.asyncvectorenv method)": [[11, "gymnasium.vector.AsyncVectorEnv.get_attr", false]], "get_attr() (gymnasium.vector.syncvectorenv method)": [[12, "gymnasium.vector.SyncVectorEnv.get_attr", false]], "get_env_id() (in module gymnasium.envs.registration)": [[4, "gymnasium.envs.registration.get_env_id", false]], "get_wrapper_attr() (gymnasium.wrapper method)": [[15, "gymnasium.Wrapper.get_wrapper_attr", false]], "graph (class in gymnasium.spaces)": [[6, "gymnasium.spaces.Graph", false]], "grayscaleobservation (class in gymnasium.wrappers)": [[18, "gymnasium.wrappers.GrayscaleObservation", false]], "grayscaleobservation (class in gymnasium.wrappers.vector)": [[14, "gymnasium.wrappers.vector.GrayscaleObservation", false]], "gymnasium.spaces": [[5, "module-gymnasium.spaces", false]], "gymnasium.wrappers": [[15, "module-gymnasium.wrappers", false]], "humanrendering (class in gymnasium.wrappers)": [[17, "gymnasium.wrappers.HumanRendering", false]], "initial() (gymnasium.experimental.functional.funcenv method)": [[3, "gymnasium.experimental.functional.FuncEnv.initial", false]], "is_bounded() (gymnasium.spaces.box method)": [[7, "gymnasium.spaces.Box.is_bounded", false]], "is_np_flattenable (gymnasium.spaces.space property)": [[5, "gymnasium.spaces.Space.is_np_flattenable", false]], "iterate() (in module gymnasium.vector.utils)": [[13, "gymnasium.vector.utils.iterate", false]], "jaxtonumpy (class in gymnasium.wrappers)": [[17, "gymnasium.wrappers.JaxToNumpy", false]], "jaxtonumpy (class in gymnasium.wrappers.vector)": [[14, "gymnasium.wrappers.vector.JaxToNumpy", false]], "jaxtotorch (class in gymnasium.wrappers)": [[17, "gymnasium.wrappers.JaxToTorch", false]], "jaxtotorch (class in gymnasium.wrappers.vector)": [[14, "gymnasium.wrappers.vector.JaxToTorch", false]], "load_env_creator() (in module gymnasium.envs.registration)": [[4, "gymnasium.envs.registration.load_env_creator", false]], "make() (in module gymnasium)": [[4, "gymnasium.make", false]], "make_vec() (in module gymnasium)": [[4, "gymnasium.make_vec", false]], "maxandskipobservation (class in gymnasium.wrappers)": [[18, "gymnasium.wrappers.MaxAndSkipObservation", false]], "metadata (gymnasium.env attribute)": [[2, "gymnasium.Env.metadata", false]], "metadata (gymnasium.vector.vectorenv attribute)": [[10, "gymnasium.vector.VectorEnv.metadata", false]], "metadata (gymnasium.wrapper property)": [[15, "gymnasium.Wrapper.metadata", false]], "module": [[5, "module-gymnasium.spaces", false], [15, "module-gymnasium.wrappers", false]], "multibinary (class in gymnasium.spaces)": [[7, "gymnasium.spaces.MultiBinary", false]], "multidiscrete (class in gymnasium.spaces)": [[7, "gymnasium.spaces.MultiDiscrete", false]], "namespace() (in module gymnasium.envs.registration)": [[4, "gymnasium.envs.registration.namespace", false]], "normalizeobservation (class in gymnasium.wrappers)": [[18, "gymnasium.wrappers.NormalizeObservation", false]], "normalizeobservation (class in gymnasium.wrappers.vector)": [[14, "gymnasium.wrappers.vector.NormalizeObservation", false]], "normalizereward (class in gymnasium.wrappers)": [[19, "gymnasium.wrappers.NormalizeReward", false]], "normalizereward (class in gymnasium.wrappers.vector)": [[14, "gymnasium.wrappers.vector.NormalizeReward", false]], "np_random (gymnasium.env property)": [[2, "gymnasium.Env.np_random", false]], "np_random (gymnasium.spaces.space property)": [[5, "gymnasium.spaces.Space.np_random", false]], "np_random (gymnasium.vector.asyncvectorenv property)": [[11, "gymnasium.vector.AsyncVectorEnv.np_random", false]], "np_random (gymnasium.vector.syncvectorenv property)": [[12, "gymnasium.vector.SyncVectorEnv.np_random", false]], "np_random (gymnasium.vector.vectorenv property)": [[10, "gymnasium.vector.VectorEnv.np_random", false]], "np_random (gymnasium.wrapper property)": [[15, "gymnasium.Wrapper.np_random", false]], "np_random() (in module gymnasium.utils.seeding)": [[9, "gymnasium.utils.seeding.np_random", false]], "np_random_seed (gymnasium.env property)": [[2, "gymnasium.Env.np_random_seed", false]], "np_random_seed (gymnasium.vector.asyncvectorenv property)": [[11, "gymnasium.vector.AsyncVectorEnv.np_random_seed", false]], "np_random_seed (gymnasium.vector.syncvectorenv property)": [[12, "gymnasium.vector.SyncVectorEnv.np_random_seed", false]], "np_random_seed (gymnasium.vector.vectorenv property)": [[10, "gymnasium.vector.VectorEnv.np_random_seed", false]], "np_random_seed (gymnasium.wrapper property)": [[15, "gymnasium.Wrapper.np_random_seed", false]], "num_envs (gymnasium.vector.vectorenv attribute)": [[10, "gymnasium.vector.VectorEnv.num_envs", false]], "numpytotorch (class in gymnasium.wrappers)": [[17, "gymnasium.wrappers.NumpyToTorch", false]], "numpytotorch (class in gymnasium.wrappers.vector)": [[14, "gymnasium.wrappers.vector.NumpyToTorch", false]], "observation() (gymnasium.experimental.functional.funcenv method)": [[3, "gymnasium.experimental.functional.FuncEnv.observation", false]], "observation() (gymnasium.observationwrapper method)": [[18, "gymnasium.ObservationWrapper.observation", false]], "observation_space (gymnasium.env attribute)": [[2, "gymnasium.Env.observation_space", false]], "observation_space (gymnasium.vector.vectorenv attribute)": [[10, "gymnasium.vector.VectorEnv.observation_space", false]], "observation_space (gymnasium.wrapper property)": [[15, "gymnasium.Wrapper.observation_space", false]], "observations() (gymnasium.vector.vectorobservationwrapper method)": [[14, "gymnasium.vector.VectorObservationWrapper.observations", false]], "observationwrapper (class in gymnasium)": [[18, "gymnasium.ObservationWrapper", false]], "oneof (class in gymnasium.spaces)": [[6, "gymnasium.spaces.OneOf", false]], "orderenforcing (class in gymnasium.wrappers)": [[17, "gymnasium.wrappers.OrderEnforcing", false]], "parse_env_id() (in module gymnasium.envs.registration)": [[4, "gymnasium.envs.registration.parse_env_id", false]], "passiveenvchecker (class in gymnasium.wrappers)": [[17, "gymnasium.wrappers.PassiveEnvChecker", false]], "play() (in module gymnasium.utils.play)": [[9, "gymnasium.utils.play.play", false]], "playablegame (class in gymnasium.utils.play)": [[9, "gymnasium.utils.play.PlayableGame", false]], "playplot (class in gymnasium.utils.play)": [[9, "gymnasium.utils.play.PlayPlot", false]], "pprint_registry() (in module gymnasium)": [[4, "gymnasium.pprint_registry", false]], "process_event() (gymnasium.utils.play.playablegame method)": [[9, "gymnasium.utils.play.PlayableGame.process_event", false]], "read_from_shared_memory() (in module gymnasium.vector.utils)": [[13, "gymnasium.vector.utils.read_from_shared_memory", false]], "recordepisodestatistics (class in gymnasium.wrappers)": [[17, "gymnasium.wrappers.RecordEpisodeStatistics", false]], "recordepisodestatistics (class in gymnasium.wrappers.vector)": [[14, "gymnasium.wrappers.vector.RecordEpisodeStatistics", false]], "recordvideo (class in gymnasium.wrappers)": [[17, "gymnasium.wrappers.RecordVideo", false]], "register() (in module gymnasium)": [[4, "gymnasium.register", false]], "registry (gymnasium.envs.registration attribute)": [[4, "gymnasium.envs.registration.registry", false]], "render() (gymnasium.env method)": [[2, "gymnasium.Env.render", false]], "render() (gymnasium.envs.functional_jax_env.functionaljaxenv method)": [[3, "gymnasium.envs.functional_jax_env.FunctionalJaxEnv.render", false]], "render() (gymnasium.vector.vectorenv method)": [[10, "gymnasium.vector.VectorEnv.render", false]], "render() (gymnasium.vector.vectorwrapper method)": [[14, "gymnasium.vector.VectorWrapper.render", false]], "render() (gymnasium.wrapper method)": [[15, "gymnasium.Wrapper.render", false]], "render_close() (gymnasium.experimental.functional.funcenv method)": [[3, "gymnasium.experimental.functional.FuncEnv.render_close", false]], "render_image() (gymnasium.experimental.functional.funcenv method)": [[3, "gymnasium.experimental.functional.FuncEnv.render_image", false]], "render_init() (gymnasium.experimental.functional.funcenv method)": [[3, "gymnasium.experimental.functional.FuncEnv.render_init", false]], "render_mode (gymnasium.env attribute)": [[2, "gymnasium.Env.render_mode", false]], "render_mode (gymnasium.vector.vectorenv attribute)": [[10, "gymnasium.vector.VectorEnv.render_mode", false]], "rendercollection (class in gymnasium.wrappers)": [[17, "gymnasium.wrappers.RenderCollection", false]], "rescaleaction (class in gymnasium.wrappers)": [[16, "gymnasium.wrappers.RescaleAction", false]], "rescaleaction (class in gymnasium.wrappers.vector)": [[14, "gymnasium.wrappers.vector.RescaleAction", false]], "rescaleobservation (class in gymnasium.wrappers)": [[18, "gymnasium.wrappers.RescaleObservation", false]], "rescaleobservation (class in gymnasium.wrappers.vector)": [[14, "gymnasium.wrappers.vector.RescaleObservation", false]], "reset() (gymnasium.env method)": [[2, "gymnasium.Env.reset", false]], "reset() (gymnasium.envs.functional_jax_env.functionaljaxenv method)": [[3, "gymnasium.envs.functional_jax_env.FunctionalJaxEnv.reset", false]], "reset() (gymnasium.vector.asyncvectorenv method)": [[11, "gymnasium.vector.AsyncVectorEnv.reset", false]], "reset() (gymnasium.vector.syncvectorenv method)": [[12, "gymnasium.vector.SyncVectorEnv.reset", false]], "reset() (gymnasium.vector.vectorenv method)": [[10, "gymnasium.vector.VectorEnv.reset", false]], "reset() (gymnasium.vector.vectorwrapper method)": [[14, "gymnasium.vector.VectorWrapper.reset", false]], "reset() (gymnasium.wrapper method)": [[15, "gymnasium.Wrapper.reset", false]], "reshapeobservation (class in gymnasium.wrappers)": [[18, "gymnasium.wrappers.ReshapeObservation", false]], "reshapeobservation (class in gymnasium.wrappers.vector)": [[14, "gymnasium.wrappers.vector.ReshapeObservation", false]], "resizeobservation (class in gymnasium.wrappers)": [[18, "gymnasium.wrappers.ResizeObservation", false]], "resizeobservation (class in gymnasium.wrappers.vector)": [[14, "gymnasium.wrappers.vector.ResizeObservation", false]], "reward() (gymnasium.experimental.functional.funcenv method)": [[3, "gymnasium.experimental.functional.FuncEnv.reward", false]], "reward() (gymnasium.rewardwrapper method)": [[19, "gymnasium.RewardWrapper.reward", false]], "rewards() (gymnasium.vector.vectorrewardwrapper method)": [[14, "gymnasium.vector.VectorRewardWrapper.rewards", false]], "rewardwrapper (class in gymnasium)": [[19, "gymnasium.RewardWrapper", false]], "sample() (gymnasium.spaces.box method)": [[7, "gymnasium.spaces.Box.sample", false]], "sample() (gymnasium.spaces.dict method)": [[6, "gymnasium.spaces.Dict.sample", false]], "sample() (gymnasium.spaces.discrete method)": [[7, "gymnasium.spaces.Discrete.sample", false]], "sample() (gymnasium.spaces.graph method)": [[6, "gymnasium.spaces.Graph.sample", false]], "sample() (gymnasium.spaces.multibinary method)": [[7, "gymnasium.spaces.MultiBinary.sample", false]], "sample() (gymnasium.spaces.multidiscrete method)": [[7, "gymnasium.spaces.MultiDiscrete.sample", false]], "sample() (gymnasium.spaces.oneof method)": [[6, "gymnasium.spaces.OneOf.sample", false]], "sample() (gymnasium.spaces.sequence method)": [[6, "gymnasium.spaces.Sequence.sample", false]], "sample() (gymnasium.spaces.space method)": [[5, "gymnasium.spaces.Space.sample", false]], "sample() (gymnasium.spaces.text method)": [[7, "gymnasium.spaces.Text.sample", false]], "sample() (gymnasium.spaces.tuple method)": [[6, "gymnasium.spaces.Tuple.sample", false]], "save_video() (in module gymnasium.utils.save_video)": [[9, "gymnasium.utils.save_video.save_video", false]], "seed() (gymnasium.spaces.box method)": [[7, "gymnasium.spaces.Box.seed", false]], "seed() (gymnasium.spaces.dict method)": [[6, "gymnasium.spaces.Dict.seed", false]], "seed() (gymnasium.spaces.discrete method)": [[7, "gymnasium.spaces.Discrete.seed", false]], "seed() (gymnasium.spaces.graph method)": [[6, "gymnasium.spaces.Graph.seed", false]], "seed() (gymnasium.spaces.multibinary method)": [[7, "gymnasium.spaces.MultiBinary.seed", false]], "seed() (gymnasium.spaces.multidiscrete method)": [[7, "gymnasium.spaces.MultiDiscrete.seed", false]], "seed() (gymnasium.spaces.oneof method)": [[6, "gymnasium.spaces.OneOf.seed", false]], "seed() (gymnasium.spaces.sequence method)": [[6, "gymnasium.spaces.Sequence.seed", false]], "seed() (gymnasium.spaces.space method)": [[5, "gymnasium.spaces.Space.seed", false]], "seed() (gymnasium.spaces.text method)": [[7, "gymnasium.spaces.Text.seed", false]], "seed() (gymnasium.spaces.tuple method)": [[6, "gymnasium.spaces.Tuple.seed", false]], "sequence (class in gymnasium.spaces)": [[6, "gymnasium.spaces.Sequence", false]], "set_attr() (gymnasium.vector.asyncvectorenv method)": [[11, "gymnasium.vector.AsyncVectorEnv.set_attr", false]], "set_attr() (gymnasium.vector.syncvectorenv method)": [[12, "gymnasium.vector.SyncVectorEnv.set_attr", false]], "set_wrapper_attr() (gymnasium.wrapper method)": [[15, "gymnasium.Wrapper.set_wrapper_attr", false]], "shape (gymnasium.spaces.space property)": [[5, "gymnasium.spaces.Space.shape", false]], "single_action_space (gymnasium.vector.vectorenv attribute)": [[10, "gymnasium.vector.VectorEnv.single_action_space", false]], "single_observation_space (gymnasium.vector.vectorenv attribute)": [[10, "gymnasium.vector.VectorEnv.single_observation_space", false]], "space (class in gymnasium.spaces)": [[5, "gymnasium.spaces.Space", false]], "spec (gymnasium.env attribute)": [[2, "gymnasium.Env.spec", false]], "spec (gymnasium.vector.vectorenv attribute)": [[10, "gymnasium.vector.VectorEnv.spec", false]], "spec (gymnasium.wrapper property)": [[15, "gymnasium.Wrapper.spec", false]], "spec() (in module gymnasium)": [[4, "gymnasium.spec", false]], "state_info() (gymnasium.experimental.functional.funcenv method)": [[3, "gymnasium.experimental.functional.FuncEnv.state_info", false]], "step() (gymnasium.env method)": [[2, "gymnasium.Env.step", false]], "step() (gymnasium.envs.functional_jax_env.functionaljaxenv method)": [[3, "gymnasium.envs.functional_jax_env.FunctionalJaxEnv.step", false]], "step() (gymnasium.vector.asyncvectorenv method)": [[11, "gymnasium.vector.AsyncVectorEnv.step", false]], "step() (gymnasium.vector.syncvectorenv method)": [[12, "gymnasium.vector.SyncVectorEnv.step", false]], "step() (gymnasium.vector.vectorenv method)": [[10, "gymnasium.vector.VectorEnv.step", false]], "step() (gymnasium.vector.vectorwrapper method)": [[14, "gymnasium.vector.VectorWrapper.step", false]], "step() (gymnasium.wrapper method)": [[15, "gymnasium.Wrapper.step", false]], "step_api_compatibility() (in module gymnasium.utils.step_api_compatibility)": [[9, "gymnasium.utils.step_api_compatibility.step_api_compatibility", false]], "stickyaction (class in gymnasium.wrappers)": [[16, "gymnasium.wrappers.StickyAction", false]], "syncvectorenv (class in gymnasium.vector)": [[12, "gymnasium.vector.SyncVectorEnv", false]], "terminal() (gymnasium.experimental.functional.funcenv method)": [[3, "gymnasium.experimental.functional.FuncEnv.terminal", false]], "text (class in gymnasium.spaces)": [[7, "gymnasium.spaces.Text", false]], "timeawareobservation (class in gymnasium.wrappers)": [[18, "gymnasium.wrappers.TimeAwareObservation", false]], "timelimit (class in gymnasium.wrappers)": [[17, "gymnasium.wrappers.TimeLimit", false]], "to_jsonable() (gymnasium.spaces.space method)": [[5, "gymnasium.spaces.Space.to_jsonable", false]], "transform() (gymnasium.experimental.functional.funcenv method)": [[3, "gymnasium.experimental.functional.FuncEnv.transform", false]], "transformaction (class in gymnasium.wrappers)": [[16, "gymnasium.wrappers.TransformAction", false]], "transformaction (class in gymnasium.wrappers.vector)": [[14, "gymnasium.wrappers.vector.TransformAction", false]], "transformobservation (class in gymnasium.wrappers)": [[18, "gymnasium.wrappers.TransformObservation", false]], "transformobservation (class in gymnasium.wrappers.vector)": [[14, "gymnasium.wrappers.vector.TransformObservation", false]], "transformreward (class in gymnasium.wrappers)": [[19, "gymnasium.wrappers.TransformReward", false]], "transformreward (class in gymnasium.wrappers.vector)": [[14, "gymnasium.wrappers.vector.TransformReward", false]], "transition() (gymnasium.experimental.functional.funcenv method)": [[3, "gymnasium.experimental.functional.FuncEnv.transition", false]], "transition_info() (gymnasium.experimental.functional.funcenv method)": [[3, "gymnasium.experimental.functional.FuncEnv.transition_info", false]], "tuple (class in gymnasium.spaces)": [[6, "gymnasium.spaces.Tuple", false]], "unflatten() (in module gymnasium.spaces.utils)": [[8, "gymnasium.spaces.utils.unflatten", false]], "unwrapped (gymnasium.env property)": [[2, "gymnasium.Env.unwrapped", false]], "unwrapped (gymnasium.vector.vectorenv property)": [[10, "gymnasium.vector.VectorEnv.unwrapped", false]], "unwrapped (gymnasium.wrapper property)": [[15, "gymnasium.Wrapper.unwrapped", false]], "vectoractionwrapper (class in gymnasium.vector)": [[14, "gymnasium.vector.VectorActionWrapper", false]], "vectorenv (class in gymnasium.vector)": [[10, "gymnasium.vector.VectorEnv", false]], "vectorizetransformaction (class in gymnasium.wrappers.vector)": [[14, "gymnasium.wrappers.vector.VectorizeTransformAction", false]], "vectorizetransformobservation (class in gymnasium.wrappers.vector)": [[14, "gymnasium.wrappers.vector.VectorizeTransformObservation", false]], "vectorizetransformreward (class in gymnasium.wrappers.vector)": [[14, "gymnasium.wrappers.vector.VectorizeTransformReward", false]], "vectorobservationwrapper (class in gymnasium.vector)": [[14, "gymnasium.vector.VectorObservationWrapper", false]], "vectorrewardwrapper (class in gymnasium.vector)": [[14, "gymnasium.vector.VectorRewardWrapper", false]], "vectorwrapper (class in gymnasium.vector)": [[14, "gymnasium.vector.VectorWrapper", false]], "wrapper (class in gymnasium)": [[15, "gymnasium.Wrapper", false]], "wrapper_spec() (gymnasium.wrapper class method)": [[15, "gymnasium.Wrapper.wrapper_spec", false]], "wrapperspec (class in gymnasium.envs.registration)": [[4, "gymnasium.envs.registration.WrapperSpec", false]], "write_to_shared_memory() (in module gymnasium.vector.utils)": [[13, "gymnasium.vector.utils.write_to_shared_memory", false]]}, "objects": {"gymnasium": [[16, 0, 1, "", "ActionWrapper"], [2, 0, 1, "", "Env"], [18, 0, 1, "", "ObservationWrapper"], [19, 0, 1, "", "RewardWrapper"], [15, 0, 1, "", "Wrapper"], [4, 4, 1, "", "make"], [4, 4, 1, "", "make_vec"], [4, 4, 1, "", "pprint_registry"], [4, 4, 1, "", "register"], [5, 5, 0, "-", "spaces"], [4, 4, 1, "", "spec"], [15, 5, 0, "-", "wrappers"]], "gymnasium.ActionWrapper": [[16, 1, 1, "", "action"]], "gymnasium.Env": [[2, 2, 1, "", "action_space"], [2, 1, 1, "", "close"], [2, 2, 1, "", "metadata"], [2, 3, 1, "", "np_random"], [2, 3, 1, "", "np_random_seed"], [2, 2, 1, "", "observation_space"], [2, 1, 1, "", "render"], [2, 2, 1, "", "render_mode"], [2, 1, 1, "", "reset"], [2, 2, 1, "", "spec"], [2, 1, 1, "", "step"], [2, 3, 1, "", "unwrapped"]], "gymnasium.ObservationWrapper": [[18, 1, 1, "", "observation"]], "gymnasium.RewardWrapper": [[19, 1, 1, "", "reward"]], "gymnasium.Wrapper": [[15, 3, 1, "", "action_space"], [15, 1, 1, "", "close"], [15, 2, 1, "", "env"], [15, 1, 1, "", "get_wrapper_attr"], [15, 3, 1, "", "metadata"], [15, 3, 1, "", "np_random"], [15, 3, 1, "", "np_random_seed"], [15, 3, 1, "", "observation_space"], [15, 1, 1, "", "render"], [15, 1, 1, "", "reset"], [15, 1, 1, "", "set_wrapper_attr"], [15, 3, 1, "", "spec"], [15, 1, 1, "", "step"], [15, 3, 1, "", "unwrapped"], [15, 1, 1, "", "wrapper_spec"]], "gymnasium.envs.functional_jax_env": [[3, 0, 1, "", "FunctionalJaxEnv"]], "gymnasium.envs.functional_jax_env.FunctionalJaxEnv": [[3, 1, 1, "", "render"], [3, 1, 1, "", "reset"], [3, 1, 1, "", "step"]], "gymnasium.envs.registration": [[4, 0, 1, "", "EnvSpec"], [4, 0, 1, "", "WrapperSpec"], [4, 2, 1, "", "current_namespace"], [4, 4, 1, "", "find_highest_version"], [4, 4, 1, "", "get_env_id"], [4, 4, 1, "", "load_env_creator"], [4, 4, 1, "", "namespace"], [4, 4, 1, "", "parse_env_id"], [4, 2, 1, "", "registry"]], "gymnasium.experimental.functional": [[3, 0, 1, "", "FuncEnv"]], "gymnasium.experimental.functional.FuncEnv": [[3, 1, 1, "", "initial"], [3, 1, 1, "", "observation"], [3, 1, 1, "", "render_close"], [3, 1, 1, "", "render_image"], [3, 1, 1, "", "render_init"], [3, 1, 1, "", "reward"], [3, 1, 1, "", "state_info"], [3, 1, 1, "", "terminal"], [3, 1, 1, "", "transform"], [3, 1, 1, "", "transition"], [3, 1, 1, "", "transition_info"]], "gymnasium.spaces": [[7, 0, 1, "", "Box"], [6, 0, 1, "", "Dict"], [7, 0, 1, "", "Discrete"], [6, 0, 1, "", "Graph"], [7, 0, 1, "", "MultiBinary"], [7, 0, 1, "", "MultiDiscrete"], [6, 0, 1, "", "OneOf"], [6, 0, 1, "", "Sequence"], [5, 0, 1, "", "Space"], [7, 0, 1, "", "Text"], [6, 0, 1, "", "Tuple"]], "gymnasium.spaces.Box": [[7, 1, 1, "", "is_bounded"], [7, 1, 1, "", "sample"], [7, 1, 1, "", "seed"]], "gymnasium.spaces.Dict": [[6, 1, 1, "", "sample"], [6, 1, 1, "", "seed"]], "gymnasium.spaces.Discrete": [[7, 1, 1, "", "sample"], [7, 1, 1, "", "seed"]], "gymnasium.spaces.Graph": [[6, 1, 1, "", "sample"], [6, 1, 1, "", "seed"]], "gymnasium.spaces.MultiBinary": [[7, 1, 1, "", "sample"], [7, 1, 1, "", "seed"]], "gymnasium.spaces.MultiDiscrete": [[7, 1, 1, "", "sample"], [7, 1, 1, "", "seed"]], "gymnasium.spaces.OneOf": [[6, 1, 1, "", "sample"], [6, 1, 1, "", "seed"]], "gymnasium.spaces.Sequence": [[6, 1, 1, "", "sample"], [6, 1, 1, "", "seed"]], "gymnasium.spaces.Space": [[5, 1, 1, "", "contains"], [5, 3, 1, "", "dtype"], [5, 1, 1, "", "from_jsonable"], [5, 3, 1, "", "is_np_flattenable"], [5, 3, 1, "", "np_random"], [5, 1, 1, "", "sample"], [5, 1, 1, "", "seed"], [5, 3, 1, "", "shape"], [5, 1, 1, "", "to_jsonable"]], "gymnasium.spaces.Text": [[7, 1, 1, "", "sample"], [7, 1, 1, "", "seed"]], "gymnasium.spaces.Tuple": [[6, 1, 1, "", "sample"], [6, 1, 1, "", "seed"]], "gymnasium.spaces.utils": [[8, 4, 1, "", "flatdim"], [8, 4, 1, "", "flatten"], [8, 4, 1, "", "flatten_space"], [8, 4, 1, "", "unflatten"]], "gymnasium.utils.env_checker": [[9, 4, 1, "", "check_env"]], "gymnasium.utils.ezpickle": [[9, 0, 1, "", "EzPickle"]], "gymnasium.utils.performance": [[9, 4, 1, "", "benchmark_init"], [9, 4, 1, "", "benchmark_render"], [9, 4, 1, "", "benchmark_step"]], "gymnasium.utils.play": [[9, 0, 1, "", "PlayPlot"], [9, 0, 1, "", "PlayableGame"], [9, 4, 1, "", "play"]], "gymnasium.utils.play.PlayPlot": [[9, 1, 1, "", "callback"]], "gymnasium.utils.play.PlayableGame": [[9, 1, 1, "", "process_event"]], "gymnasium.utils.save_video": [[9, 4, 1, "", "capped_cubic_video_schedule"], [9, 4, 1, "", "save_video"]], "gymnasium.utils.seeding": [[9, 4, 1, "", "np_random"]], "gymnasium.utils.step_api_compatibility": [[9, 4, 1, "", "convert_to_done_step_api"], [9, 4, 1, "", "convert_to_terminated_truncated_step_api"], [9, 4, 1, "", "step_api_compatibility"]], "gymnasium.vector": [[11, 0, 1, "", "AsyncVectorEnv"], [12, 0, 1, "", "SyncVectorEnv"], [14, 0, 1, "", "VectorActionWrapper"], [10, 0, 1, "", "VectorEnv"], [14, 0, 1, "", "VectorObservationWrapper"], [14, 0, 1, "", "VectorRewardWrapper"], [14, 0, 1, "", "VectorWrapper"]], "gymnasium.vector.AsyncVectorEnv": [[11, 1, 1, "", "call"], [11, 1, 1, "", "close"], [11, 1, 1, "", "get_attr"], [11, 3, 1, "", "np_random"], [11, 3, 1, "", "np_random_seed"], [11, 1, 1, "", "reset"], [11, 1, 1, "", "set_attr"], [11, 1, 1, "", "step"]], "gymnasium.vector.SyncVectorEnv": [[12, 1, 1, "", "call"], [12, 1, 1, "", "close"], [12, 1, 1, "", "get_attr"], [12, 3, 1, "", "np_random"], [12, 3, 1, "", "np_random_seed"], [12, 1, 1, "", "reset"], [12, 1, 1, "", "set_attr"], [12, 1, 1, "", "step"]], "gymnasium.vector.VectorActionWrapper": [[14, 1, 1, "", "actions"]], "gymnasium.vector.VectorEnv": [[10, 2, 1, "", "action_space"], [10, 1, 1, "", "close"], [10, 2, 1, "", "closed"], [10, 2, 1, "", "metadata"], [10, 3, 1, "", "np_random"], [10, 3, 1, "", "np_random_seed"], [10, 2, 1, "", "num_envs"], [10, 2, 1, "", "observation_space"], [10, 1, 1, "", "render"], [10, 2, 1, "", "render_mode"], [10, 1, 1, "", "reset"], [10, 2, 1, "", "single_action_space"], [10, 2, 1, "", "single_observation_space"], [10, 2, 1, "", "spec"], [10, 1, 1, "", "step"], [10, 3, 1, "", "unwrapped"]], "gymnasium.vector.VectorObservationWrapper": [[14, 1, 1, "", "observations"]], "gymnasium.vector.VectorRewardWrapper": [[14, 1, 1, "", "rewards"]], "gymnasium.vector.VectorWrapper": [[14, 1, 1, "", "close"], [14, 1, 1, "", "render"], [14, 1, 1, "", "reset"], [14, 1, 1, "", "step"]], "gymnasium.vector.utils": [[13, 4, 1, "", "CloudpickleWrapper"], [13, 4, 1, "", "batch_space"], [13, 4, 1, "", "clear_mpi_env_vars"], [13, 4, 1, "", "concatenate"], [13, 4, 1, "", "create_empty_array"], [13, 4, 1, "", "create_shared_memory"], [13, 4, 1, "", "iterate"], [13, 4, 1, "", "read_from_shared_memory"], [13, 4, 1, "", "write_to_shared_memory"]], "gymnasium.wrappers": [[18, 0, 1, "", "AddRenderObservation"], [17, 0, 1, "", "ArrayConversion"], [17, 0, 1, "", "AtariPreprocessing"], [17, 0, 1, "", "Autoreset"], [16, 0, 1, "", "ClipAction"], [19, 0, 1, "", "ClipReward"], [18, 0, 1, "", "DelayObservation"], [18, 0, 1, "", "DtypeObservation"], [18, 0, 1, "", "FilterObservation"], [18, 0, 1, "", "FlattenObservation"], [18, 0, 1, "", "FrameStackObservation"], [18, 0, 1, "", "GrayscaleObservation"], [17, 0, 1, "", "HumanRendering"], [17, 0, 1, "", "JaxToNumpy"], [17, 0, 1, "", "JaxToTorch"], [18, 0, 1, "", "MaxAndSkipObservation"], [18, 0, 1, "", "NormalizeObservation"], [19, 0, 1, "", "NormalizeReward"], [17, 0, 1, "", "NumpyToTorch"], [17, 0, 1, "", "OrderEnforcing"], [17, 0, 1, "", "PassiveEnvChecker"], [17, 0, 1, "", "RecordEpisodeStatistics"], [17, 0, 1, "", "RecordVideo"], [17, 0, 1, "", "RenderCollection"], [16, 0, 1, "", "RescaleAction"], [18, 0, 1, "", "RescaleObservation"], [18, 0, 1, "", "ReshapeObservation"], [18, 0, 1, "", "ResizeObservation"], [16, 0, 1, "", "StickyAction"], [18, 0, 1, "", "TimeAwareObservation"], [17, 0, 1, "", "TimeLimit"], [16, 0, 1, "", "TransformAction"], [18, 0, 1, "", "TransformObservation"], [19, 0, 1, "", "TransformReward"]], "gymnasium.wrappers.vector": [[14, 0, 1, "", "ArrayConversion"], [14, 0, 1, "", "ClipAction"], [14, 0, 1, "", "ClipReward"], [14, 0, 1, "", "DictInfoToList"], [14, 0, 1, "", "DtypeObservation"], [14, 0, 1, "", "FilterObservation"], [14, 0, 1, "", "FlattenObservation"], [14, 0, 1, "", "GrayscaleObservation"], [14, 0, 1, "", "JaxToNumpy"], [14, 0, 1, "", "JaxToTorch"], [14, 0, 1, "", "NormalizeObservation"], [14, 0, 1, "", "NormalizeReward"], [14, 0, 1, "", "NumpyToTorch"], [14, 0, 1, "", "RecordEpisodeStatistics"], [14, 0, 1, "", "RescaleAction"], [14, 0, 1, "", "RescaleObservation"], [14, 0, 1, "", "ReshapeObservation"], [14, 0, 1, "", "ResizeObservation"], [14, 0, 1, "", "TransformAction"], [14, 0, 1, "", "TransformObservation"], [14, 0, 1, "", "TransformReward"], [14, 0, 1, "", "VectorizeTransformAction"], [14, 0, 1, "", "VectorizeTransformObservation"], [14, 0, 1, "", "VectorizeTransformReward"]]}, "objnames": {"0": ["py", "class", "Python class"], "1": ["py", "method", "Python method"], "2": ["py", "attribute", "Python attribute"], "3": ["py", "property", "Python property"], "4": ["py", "function", "Python function"], "5": ["py", "module", "Python module"]}, "objtypes": {"0": "py:class", "1": "py:method", "2": "py:attribute", "3": "py:property", "4": "py:function", "5": "py:module"}, "terms": {"": [1, 2, 3, 5, 6, 7, 9, 10, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 126, 127, 128, 129, 130, 131, 133, 134, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 149, 150, 151, 152, 153, 154, 155, 156, 157, 158, 159, 161, 163, 165, 166, 167, 169, 173, 174, 175, 177, 178], "0": [2, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 127, 128, 129, 131, 132, 133, 134, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 150, 151, 152, 153, 154, 158, 159, 161, 163, 165, 166, 167, 173, 174, 175, 177, 178], "00": [2, 10, 18], "000": 163, "00000000e": [10, 18], "00048403": 14, "000635": [10, 14], "00080468": 14, "0008876301247721108": 19, "001": [133, 135, 140, 163, 174, 178], "00105192": 14, "00127": 14, "00133522": 14, "00142543": 14, "0015": 134, "002": [18, 139, 147, 169], "00209899": 14, "00214607": 11, "0025": [133, 134], "00266526": 14, "003": 140, "00372536": 14, "00395268": 14, "005": [144, 145, 178], "00529102": 14, "00545912": 14, "0059888": 18, "00611216": [10, 18], "00614867": 14, "00615723": 14, "00624371": 14, "00708": 6, "00711833": 6, "00715587": 14, "007812": 14, "008": [139, 147], "00848456": 10, "00942293": 10, "00987654": 158, "01": [2, 10, 14, 16, 18, 129, 137, 138, 141, 142, 143, 144, 145, 146, 155, 156, 159, 163, 169, 174, 178], "010162116476634746": 19, "01098382": [10, 14], "01162461": 10, "01234567": 158, "0123456789": 7, "0123456789abcdefghijklmnopqrstuvwxyzabcdefghijklmnopqrstuvwxyz": 7, "01431748": 10, "01456789": 158, "015": 140, "01522993": 10, "01734283": [10, 16], "01823519": [10, 14, 16, 18], "0197368": [10, 18], "02": [10, 18, 145, 155, 156, 163], "0203607": 16, "0219676": 14, "02345678": 158, "02418869": 10, "024251968": 14, "02438": 178, "02480598": [10, 14], "02727336": [10, 18], "02728892": 16, "0273956": [10, 18], "02796401": [10, 14, 16, 18], "02852531": [10, 14], "02858594": [10, 14], "02859527": [10, 16], "029028230434438706": 14, "02909703": 10, "03": [14, 129, 155, 156], "03156282": [10, 14, 16, 18], "03203924": [10, 14], "0333221090036294": 14, "03332211": 14, "03359492141887935": 14, "03392126": 10, "03516225": 10, "03517495": [10, 14], "03525399": 16, "03585979": [10, 18], "03625453": [10, 18], "03647037": 132, "03774345": 10, "03812904": 16, "03822722": 10, "04": [14, 16, 146, 155], "0446179": [10, 14, 16, 18], "04562247": 10, "0469136": [10, 14], "0469184": 10, "04731862": 10, "04740972": 10, "04794393": 16, "04799704": 10, "05": [14, 132, 137, 138, 141, 144, 155, 156, 163, 169], "055928": 14, "05592803": 132, "06": [155, 156], "06296527": 14, "06296527291998574": 14, "0631256": 14, "06312564": 132, "0640786": 14, "06540678": 18, "06670535": 16, "07": [133, 134, 155, 156], "07287608": 131, "07422512": 18, "08": [155, 156], "0808398": 11, "08227695": 18, "0892358": [14, 132], "09": [155, 156], "09417735": 13, "09613613": 18, "0_": [137, 138, 142, 144], "0_2": [144, 145], "0_3": 144, "0a2": 132, "0th": 17, "0x7f04efcb8850": 158, "0x7fbb5efd0490": 15, "1": [2, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 127, 128, 129, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 150, 151, 152, 153, 154, 158, 159, 161, 163, 165, 166, 167, 173, 174, 175, 177, 178], "10": [6, 7, 14, 17, 18, 127, 129, 135, 137, 138, 139, 140, 141, 142, 144, 145, 146, 147, 150, 151, 152, 154, 155, 156, 158, 159, 160, 161, 163, 165, 174, 177, 178], "100": [6, 8, 14, 17, 127, 128, 129, 131, 134, 139, 144, 148, 151, 152, 153, 161, 163, 169, 173], "1000": [9, 17, 128, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 157, 161, 163, 169, 177, 178], "1006": 156, "1009": 156, "100_000": [163, 174], "1013": 156, "10172354684460168": 14, "10172355": 14, "1018": 156, "1019": 156, "1027": 156, "1033": 156, "105": [137, 156], "107": 137, "1075": 156, "1086": 156, "1087": 156, "1094": 156, "1095": 156, "10_000": 161, "10th": 160, "10x": 174, "11": [14, 137, 138, 139, 140, 141, 144, 147, 150, 151, 152, 155, 174, 178], "110": 156, "1105": 156, "1107": 156, "1109": 156, "11185605": 131, "1119": 156, "112": 156, "1120": 156, "11448676": 14, "117": 156, "12": [8, 16, 17, 18, 129, 131, 132, 137, 138, 139, 140, 141, 144, 147, 151, 152, 156, 163, 173, 174, 178], "120": 178, "12224312": [11, 12], "1229": 156, "123": [2, 6, 10, 11, 14, 16, 17, 18, 19, 131, 132, 133, 134, 135, 156, 160, 175], "1230": 156, "124": 156, "1240": 156, "1243": 156, "125": 156, "1250": 156, "1253": 156, "125637": 6, "1260": 156, "12625128": 131, "1264": 156, "1271": 156, "128": 178, "1280": 136, "1283": 156, "1285": 156, "1288": 156, "1289": 156, "1291": 156, "1293": 156, "1294": 156, "1297": 156, "1299": 156, "13": [137, 138, 140, 141, 144, 147, 154, 155, 156], "130": [140, 141, 156], "1304": 156, "1306": 156, "1308": 156, "1310": 156, "1312": 156, "1315": 156, "1319": 156, "132": [151, 152, 156], "1328": 156, "1329": 156, "1333": 156, "1334": 156, "136": 156, "1361": 156, "1378": 156, "138": 156, "1387": 156, "139": 156, "1393": 156, "1396": 156, "14": [137, 138, 140, 141, 144, 147, 155, 156, 174], "141": 156, "1415927": 127, "143": 156, "145": 137, "1455": 17, "146": 156, "14995256": [11, 12], "15": [8, 16, 17, 18, 19, 129, 137, 138, 140, 141, 144, 147, 153, 161, 175, 178], "150": [9, 173], "1500": 155, "1506": 178, "15089367": [10, 16], "1511158": 18, "155": 156, "1598639586606745": 14, "16": [135, 137, 138, 140, 141, 144, 147, 153, 155, 156, 174, 177], "160": 156, "1600": 127, "1613": 154, "164": 156, "16717631": 10, "17": [137, 138, 140, 141, 144, 147, 150, 155], "17032": 156, "171": 156, "1710671": 10, "172": 156, "173": 156, "174": 156, "17752565": 131, "178": 156, "179": 156, "18": [18, 137, 138, 140, 141, 144, 147, 155], "1800": 175, "183": 156, "184": 156, "1851753": 11, "186": 156, "1878752": 12, "18847767": 10, "18879032e": [10, 18], "1887903e": 2, "18933342": 6, "19": [137, 140, 141, 144, 178], "190": 156, "19049619": 6, "1938739": 14, "195": [156, 169], "19559774": 10, "199": 9, "1990": [133, 134], "1995": 131, "1996": 131, "1_": 145, "1b15": 155, "1d": [158, 159, 177], "1e": [14, 18, 19, 139, 140, 141, 146, 147, 177], "1f": 161, "2": [2, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 16, 17, 18, 19, 128, 129, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 150, 151, 152, 153, 154, 158, 159, 161, 163, 165, 166, 167, 173, 174, 175, 177, 178], "20": [129, 137, 140, 141, 144, 154, 156, 174, 175, 178], "200": [9, 17, 129, 131, 132, 133, 135, 153, 154, 156, 161], "2000": [9, 127, 154, 175], "2004": 177, "200th": 17, "2014": 128, "2016": 178, "2017": 155, "20172954": 18, "2018": [16, 17, 131, 155], "2019": 155, "2020": [148, 150, 151, 152], "2021": [136, 148, 155], "2022": [136, 155, 156], "2023": 156, "2024": 156, "2025": 156, "205": 156, "206": 156, "208": 156, "20946532": 14, "2095": 132, "21": [18, 19, 137, 140, 141, 144, 150, 156, 163, 174, 178], "210x180": 17, "215": 156, "216": 156, "21649833": 6, "218": 156, "219": 156, "21944423": 14, "22": [17, 137, 140, 141, 144, 156, 174], "220": 174, "221": 156, "223": 156, "224": 156, "225": 156, "227": 154, "229": 177, "23": [137, 140, 141, 144, 156, 161], "230": 156, "234": 156, "235": 156, "235794": 6, "2359734": 14, "238": 156, "24": [14, 17, 18, 127, 128, 129, 132, 137, 140, 141, 156, 174], "24002443": 10, "2407": 156, "241": 156, "244": 156, "24503504": 14, "2456": 155, "246": 156, "247": 156, "2487226": 10, "249": 156, "25": [2, 8, 10, 17, 19, 137, 139, 140, 141, 147, 154, 156, 161, 169], "250": [156, 161], "250th": 161, "252": 156, "2524": 155, "254": 156, "255": [17, 18, 128, 156, 165], "25533703": 18, "256": 177, "257": 156, "25715804": 10, "258": 156, "259": 156, "25g": 137, "26": [2, 17, 137, 140, 141, 166, 177], "26141977": 10, "264": 156, "264d": 169, "267": 156, "2671": 155, "2678": 155, "268": 156, "2684": 155, "27": [9, 19, 140, 141], "270": 156, "272": 156, "2736044": 135, "274": [131, 156], "274334": 131, "27648": [14, 18, 158], "277": 156, "278": 156, "27800309628058434": 14, "279": 156, "28": [14, 131, 140, 141], "281": 156, "282": 156, "2831855": 129, "284": 156, "29": [17, 140, 141, 155, 161], "2906": 155, "292": 156, "2d": [136, 145, 148, 159, 167], "2f": 161, "2gb": 155, "3": [2, 4, 5, 6, 7, 8, 9, 10, 12, 13, 14, 15, 16, 17, 18, 19, 127, 128, 129, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 150, 151, 152, 153, 154, 158, 159, 161, 163, 165, 173, 174, 175, 177, 178], "30": [2, 9, 17, 140, 141, 154, 156], "300": [127, 154, 159, 165, 175], "3000": 9, "3016": 155, "303": 154, "3034542e": 14, "3036": 155, "3037": 155, "304": 156, "3040": 155, "3041": 155, "3044": 155, "3072": 155, "30759571": 169, "3076": 155, "3080": 155, "3083": 155, "31": [140, 141, 156], "3110827": 10, "3118435e": 14, "3152": 19, "3154": 19, "32": [18, 140, 141, 150, 177, 178], "321": 156, "323": [144, 156], "32351476": 18, "327": [137, 156], "329": 156, "33": [140, 141], "330": 156, "331": 156, "3319138": 10, "332": 156, "33293587": [10, 16], "333": 156, "337": 156, "338": 156, "339": 156, "34": [140, 141], "340": 156, "341": 156, "342": 156, "34641072": 16, "34756234": 16, "348": [140, 141], "35": [140, 141, 156], "350": [140, 141], "355": 156, "36": [6, 140, 141, 151, 152], "37": [140, 141, 156], "373": 156, "38": [140, 141], "39": [140, 141, 156], "3991573": 6, "3d": [136, 137, 140, 141, 148, 159, 174], "3f": 163, "3rd": 136, "3v3": 148, "4": [2, 6, 7, 8, 9, 10, 14, 16, 17, 18, 127, 128, 129, 131, 132, 133, 134, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 150, 151, 152, 153, 154, 156, 158, 159, 161, 163, 165, 167, 173, 174, 177], "40": [140, 141], "400": [18, 154], "403": 156, "404": [154, 156], "405": 156, "407": 156, "41": [140, 141, 156], "4123625": 135, "418": [132, 156, 158], "41887903": [10, 18, 132], "4189": 6, "42": [6, 7, 10, 11, 12, 13, 16, 18, 140, 141, 156, 157, 159, 160, 163, 178], "424": 156, "42683297": 14, "42884544": 14, "429": 156, "43": [140, 141, 163], "433": 156, "435": 156, "4351738": 14, "4354835e": 14, "43887845": 13, "44": [6, 140, 141], "440": 156, "444": 156, "44504836": 14, "44799727": 14, "4488689e": 14, "45": [134, 144, 163], "450": 156, "451": 156, "459": 156, "4624777": 14, "46352962": [14, 133], "46515748": 14, "46543318": 14, "46546045": 14, "46553135": 14, "47": [151, 152], "47037": 6, "47377947": 14, "474": 156, "47599354": 14, "47de": 169, "48": [151, 152, 163], "480": 136, "4808415e": 16, "482": 156, "48468155": 14, "48657528": 14, "487": 156, "49": 163, "491": 156, "495": 156, "497": 156, "498371": 14, "4x12": [151, 152], "4x4": 153, "4\u03c0": 131, "5": [6, 7, 8, 9, 10, 13, 14, 16, 17, 18, 19, 127, 128, 129, 131, 133, 134, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 150, 154, 159, 163, 165, 173, 174, 175, 177, 178], "50": [17, 129, 137, 138, 139, 140, 141, 142, 144, 145, 146, 147, 163, 177], "500": [17, 18, 131, 132, 154, 155, 158, 161, 163, 174, 178], "5000": 173, "503": 156, "51": [6, 156], "510": 156, "512": [156, 165], "515": 156, "516": 156, "518": 156, "520": 156, "522": 156, "524": 156, "525": 156, "5281": 156, "529": 156, "533": 156, "5342437e": 14, "535": 156, "536": 156, "538": 156, "54": 6, "540": 156, "5420062": 16, "548": 156, "55": [6, 156], "553": 156, "554": 156, "557": 156, "558": 156, "561": 156, "5635296": 134, "564": 156, "566371": 131, "567": 131, "5676788": 18, "569": 156, "57": 178, "572": 156, "573": 156, "576": 156, "5760367": [11, 12], "58": 156, "580": 156, "581": 156, "583": 156, "5836242": 6, "588": 156, "589": 156, "58922320": 173, "590": 156, "594091": 6, "5e": [137, 139, 140, 141, 147, 169], "5e3": 177, "5gb": 155, "5x": 156, "5x5": [154, 159], "6": [8, 14, 16, 17, 18, 129, 131, 133, 134, 135, 137, 138, 139, 140, 141, 142, 144, 145, 146, 147, 151, 152, 154, 156, 161, 173, 177], "60": [8, 156], "600": [18, 178], "604": 156, "608": 156, "61": 156, "6102389": 12, "612": 156, "6120394": 18, "616": 156, "6193494": 11, "62": [6, 11, 12], "62259156": 14, "63": [6, 7], "63214064": 6, "634": 156, "6343064e": 14, "6344974": 16, "635": 156, "6382770e": 16, "639": 154, "6397772e": 16, "64": [6, 156], "6608303": 16, "666": 129, "669": 6, "67": 161, "6822636": 6, "683": 156, "68512": 6, "695": 156, "697368": 13, "6fn5ja9uzquzxgkvpwtqjz1eyjcs3hj3": 169, "7": [7, 9, 129, 134, 135, 137, 138, 139, 140, 141, 142, 144, 145, 146, 147, 148, 156, 169, 178], "70": 156, "708": 156, "709": 156, "714599": 11, "7183299": 18, "72": 156, "720": 136, "7257502": 6, "729": 9, "73": 156, "731": 156, "732": 128, "74": 156, "748": 156, "75": [16, 137, 169], "75cm": 137, "76": 161, "7619033": 14, "762": 156, "7695615": 12, "77": 6, "77395606": 13, "774": 156, "78": [137, 140, 141, 156, 161], "7851154": 11, "788": 156, "789": 156, "791": 156, "79221743": 12, "8": [6, 9, 10, 14, 18, 19, 128, 129, 131, 132, 135, 137, 138, 139, 140, 141, 142, 144, 145, 146, 147, 153, 155, 156, 158, 159, 173, 175, 177, 178], "80": [153, 154], "800": [156, 175], "8000": 1, "80000019": [10, 18], "80000019e": [10, 18], "8000002e": 2, "801": 156, "81": [11, 12, 135, 156], "810": 156, "811": 156, "812": 156, "8127025": 156, "8127026": 156, "817": 156, "8174238": [11, 12], "81882": 6, "827": 156, "83": 156, "830": 156, "83506": 6, "838": 156, "84": [6, 17], "8498053": 12, "84x84": 17, "85859793": 13, "867": 156, "886": 156, "889": 156, "88g": 137, "89": [6, 156], "8914354": 18, "89235795": 135, "893": 156, "89345848": 14, "8934584807363618": 14, "8971417e": 14, "898": 156, "8f1d43620bc6bb580df6e80b0dc05c48": 131, "8gb": 155, "8x8": 153, "9": [11, 12, 14, 16, 131, 135, 137, 138, 139, 140, 141, 142, 144, 145, 147, 156, 174, 178], "90": 174, "9053838": 6, "9061728": 14, "90849805": 14, "910": 137, "91101986": 135, "91244936": [11, 12], "915": 156, "91g": 137, "9216": 14, "924": 156, "926": [128, 156], "928024": 6, "9296501": 14, "932": 156, "934": 156, "9375233e": 14, "9380709": 16, "941": 156, "9416149": 14, "9428282": 14, "9429494": 14, "95": [128, 163, 173, 174, 175, 178], "9503881": 14, "950912": 6, "952": 156, "9532328e": 14, "956": 156, "957": 156, "958": 156, "959": 156, "96": [14, 18, 128, 158], "9635296": 14, "96495728": 11, "965": 156, "96562607": 12, "96x96": [128, 158], "97562236": 13, "977": 156, "978": 156, "97854": 6, "979": 156, "9808417e": 16, "982": 156, "98219293": 12, "98270553": 11, "9841162": 131, "9886932": [11, 12], "9898634e": 14, "99": [14, 19, 177, 178], "9944268": 18, "997341": 131, "999": [134, 178], "99902063": 12, "9999": 129, "9\u03c0": 131, "A": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 14, 16, 17, 18, 19, 20, 127, 128, 131, 132, 134, 136, 137, 138, 139, 140, 141, 142, 144, 145, 146, 147, 148, 150, 151, 152, 153, 155, 156, 158, 159, 165, 166, 167, 174, 177, 178], "AND": 160, "And": [165, 169], "As": [2, 5, 10, 15, 17, 131, 132, 136, 149, 151, 152, 155, 156, 158, 159, 162, 167, 175, 177, 178], "At": [14, 17, 158], "Be": 156, "But": [137, 163], "By": [2, 4, 10, 17, 18, 131, 137, 138, 139, 140, 141, 146, 147, 148, 173], "For": [2, 3, 5, 7, 8, 9, 10, 17, 18, 19, 128, 129, 136, 151, 152, 153, 154, 155, 156, 158, 159, 160, 161, 162, 163, 165, 167, 169, 174, 178], "If": [1, 2, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 127, 128, 129, 132, 134, 137, 139, 140, 147, 148, 150, 151, 152, 153, 154, 155, 156, 157, 158, 160, 165, 167, 169, 171, 174, 175, 178], "In": [2, 7, 9, 13, 15, 16, 19, 128, 129, 130, 131, 132, 137, 138, 139, 140, 141, 145, 146, 147, 154, 155, 156, 158, 159, 161, 162, 165, 166, 167, 169, 173, 174, 175, 177, 178], "It": [2, 4, 6, 7, 9, 10, 11, 12, 16, 17, 127, 136, 137, 140, 141, 144, 145, 146, 148, 155, 156, 158, 159, 161, 162, 163, 165, 174, 177], "Its": 148, "No": [16, 17, 18, 150, 155, 159, 160, 177], "Not": [17, 155, 159], "OR": 160, "On": [131, 132, 133, 134, 135, 155, 156, 159, 175], "One": [7, 137, 140, 141, 156, 158, 159], "Or": [154, 160], "Such": [15, 167], "That": [3, 132, 158, 163], "The": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 126, 127, 128, 129, 130, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 150, 151, 152, 153, 154, 155, 156, 157, 158, 159, 161, 164, 165, 166, 168, 169, 170, 171, 172, 173, 174, 176, 177, 178], "Then": [1, 15, 159, 160, 165, 167], "There": [7, 15, 127, 129, 130, 133, 134, 136, 140, 142, 148, 151, 152, 154, 155, 156, 165], "These": [9, 126, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 155, 156, 160, 174, 177], "To": [1, 2, 4, 9, 10, 13, 15, 17, 18, 127, 128, 129, 131, 132, 144, 154, 155, 156, 158, 165, 167, 169, 174, 175, 177, 178], "WITH": 173, "Will": [9, 17, 20, 156], "With": [6, 14, 17, 148, 151, 152, 156, 163, 173, 174, 175, 178], "_": [9, 10, 11, 12, 13, 14, 16, 17, 18, 19, 128, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 156, 157, 160, 163, 167, 169, 175, 178], "_2": [137, 138, 139, 140, 141, 144, 145, 146, 147], "__all__": 156, "__class__": 178, "__del__": 156, "__eq__": 155, "__future__": [174, 177, 178], "__get_attr__": 156, "__getattr__": 156, "__getitem__": 155, "__init__": [2, 9, 14, 15, 16, 18, 156, 163, 165, 167, 174, 175, 177, 178], "__len__": 155, "__main__": 178, "__name__": 178, "__setitem__": 155, "_action": 141, "_action_to_direct": [159, 165], "_agent_loc": [159, 165], "_async_work": 11, "_bigint_from_byt": 155, "_build": 1, "_control": 141, "_cost": [140, 141], "_dtypedict": 5, "_episod": [14, 17], "_final_info": 14, "_final_observ": 14, "_get_info": [159, 165], "_get_ob": [159, 165], "_int_list_from_bigint": 155, "_k": 14, "_modul": 18, "_nois": [137, 138, 139, 140, 141, 142, 143, 146, 147], "_np_random": [2, 5, 10, 155], "_np_random_se": [2, 10], "_rang": [140, 141], "_render_fram": 165, "_replac": 175, "_reward_ctrl": 14, "_reward_run": 14, "_scale": [137, 138, 139, 140, 141, 142, 143, 146, 147], "_script": 1, "_static": [1, 173], "_step_mujoco_simul": 156, "_supportsdtyp": 5, "_target_loc": [159, 165], "_timelimit": 155, "_update_running_mean": [14, 19], "_worker": 11, "_x_posit": 14, "_x_veloc": 14, "a2c": [156, 170, 176], "a3c": 178, "a_": [166, 178], "a_0": 6, "a_i": 6, "a_max": 178, "a_min": 178, "a_n": 6, "a_t": 166, "aaronwalsman": 156, "ab": [128, 156, 178], "abbeel": [137, 178], "abdomen": [140, 141], "abdomen_i": [140, 141], "abdomen_x": [140, 141], "abdomen_z": [140, 141], "abil": [156, 158, 162], "abl": [156, 166], "abouelsaadat": 156, "about": [2, 3, 9, 127, 128, 129, 131, 132, 133, 134, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 150, 151, 152, 153, 154, 156, 158, 160, 161, 162, 165, 166, 174, 177], "abov": [2, 6, 7, 9, 131, 132, 135, 136, 156, 158, 161, 177, 178], "absolut": [141, 143, 147, 169], "abstract": [156, 165], "ac": [150, 163, 174], "academ": 162, "academia": 156, "acceler": [128, 133, 134, 135, 148, 155, 156, 178], "accent_r": 174, "accept": [2, 5, 7, 9, 17, 155, 156, 165, 169], "access": [14, 15, 17, 148, 155, 156, 158, 160, 161, 167], "accid": 155, "accident": [155, 156], "accord": [4, 5, 6, 7, 129, 169, 178], "accordingli": 165, "account": [148, 155, 156, 175], "accur": [136, 156, 163], "accuraci": 136, "achiev": [2, 131, 150, 155, 158, 162, 169, 173, 178], "acquir": 136, "acrobot": [130, 155], "acrobotenv": 131, "acronym": 177, "across": [13, 156, 173], "act": [14, 156, 158, 162, 163, 167, 174], "action": [2, 3, 4, 5, 6, 7, 9, 10, 11, 12, 15, 17, 20, 130, 136, 148, 149, 155, 156, 157, 160, 161, 165, 167, 169, 170, 175, 176, 177, 178], "action_log_prob": 178, "action_logit": 178, "action_logits_vec": 178, "action_mask": [154, 173], "action_masking_taxi": 173, "action_mean": 177, "action_pd": 178, "action_s": 175, "action_shap": 178, "action_spac": [2, 5, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 154, 156, 157, 158, 159, 160, 161, 163, 165, 167, 169, 173, 174, 175, 177], "action_space_dim": 177, "action_stddev": 177, "action_valu": 174, "actionwrapp": [14, 15, 16], "actor": 177, "actor_lay": 178, "actor_loss": 178, "actor_losses_moving_averag": 178, "actor_lr": 178, "actor_optim": 178, "actor_weight": 178, "actor_weights_path": 178, "acttyp": [2, 3, 9, 10, 11, 12, 14, 15, 16, 17, 18, 19, 156], "actual": [137, 154, 156, 158, 159, 161, 163, 165, 175, 178], "actuat": [131, 132, 140, 141, 156, 169], "acycl": 148, "ad": [14, 16, 17, 18, 19, 129, 132, 134, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 154, 155, 156, 158, 160, 165], "adamw": 177, "adapt": [132, 142, 143, 148, 151, 152, 161], "add": [1, 4, 5, 9, 11, 16, 17, 18, 19, 20, 128, 136, 137, 140, 141, 151, 152, 154, 155, 156, 158, 161, 163, 165, 167, 174, 178], "add_mark": 156, "add_subplot": 174, "addit": [2, 5, 129, 130, 148, 150, 154, 155, 156, 158, 159, 161, 163, 165, 169, 174, 177, 178], "addition": [148, 155, 156], "additional_wrapp": [4, 156], "addrenderobserv": [18, 20, 156], "address": 156, "addwhitenois": 156, "adilzouitin": 155, "adjac": 6, "adjust": [148, 169], "advanc": [11, 131, 148, 156, 161], "advantag": [137, 156, 165], "advis": 14, "affect": [6, 156, 159], "affin": [14, 16, 18, 20, 129], "after": [2, 3, 5, 9, 10, 17, 129, 137, 138, 139, 140, 141, 144, 145, 146, 147, 150, 154, 155, 156, 158, 160, 161, 163, 165, 166, 173, 174, 177, 178], "again": [2, 129, 154, 165], "against": [148, 155], "agent": [2, 4, 5, 14, 17, 20, 127, 128, 129, 133, 137, 138, 139, 140, 141, 142, 143, 145, 146, 147, 148, 155, 156, 159, 160, 162, 165, 166, 167, 173, 175], "agent_i": 159, "agent_posit": 167, "agent_x": 159, "agnost": [137, 138, 139, 140, 141, 146, 147], "ago": 156, "ahead": 155, "ahmedo42": 155, "ai": 148, "aim": [136, 139, 146, 147, 155, 156, 164, 168, 170, 172, 176, 177], "air": [144, 148, 156], "al": [4, 16, 17, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 155, 156, 160, 174], "ale_pi": [17, 156, 160], "alexdluken": 156, "algorithm": [2, 5, 10, 148, 149, 154, 155, 156, 158, 159, 160, 161, 163, 166, 169, 171, 174, 175, 177, 178], "alias": 148, "align": [154, 156, 160], "aliv": [140, 147], "alive_bonu": 142, "all": [2, 4, 5, 6, 7, 10, 11, 12, 13, 14, 15, 16, 17, 18, 126, 128, 129, 130, 131, 132, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 150, 151, 152, 153, 155, 156, 158, 159, 160, 167, 169, 170, 171, 173, 174, 175, 177, 178], "all_act": 175, "all_stat": 175, "alloc": 159, "allow": [3, 4, 5, 6, 9, 11, 12, 14, 15, 17, 18, 19, 20, 131, 132, 133, 134, 135, 140, 141, 142, 143, 147, 148, 155, 156, 158, 159, 160, 165, 167, 177, 178], "almost": 155, "along": [2, 9, 10, 15, 18, 128, 132, 133, 134, 142, 143, 146, 151, 152, 155, 156, 158], "alongsid": 158, "alpha": [161, 173], "alphabet": 7, "alphanumer": 7, "alreadi": [2, 10, 15, 156, 158], "alreadypendingcallerror": 11, "also": [2, 7, 9, 10, 11, 12, 17, 18, 127, 128, 129, 130, 136, 137, 143, 148, 155, 156, 158, 159, 160, 165, 166, 167, 169, 174, 175, 177, 178], "alter": [2, 15, 156, 158, 165], "altern": [1, 148, 156, 159], "although": [7, 137, 169], "altogeth": 169, "alwai": [7, 8, 17, 129, 133, 134, 137, 140, 141, 142, 145, 146, 150, 151, 152, 153, 156, 158, 163, 165], "amacati": 156, "ambigu": 160, "among": [16, 130, 136], "amount": [9, 127, 132, 142, 143, 177], "amp": 156, "amtamasi": 155, "an": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 129, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 150, 151, 152, 153, 154, 155, 156, 157, 158, 159, 160, 161, 162, 165, 166, 167, 169, 171, 173, 175, 178], "analog": 2, "analogi": 144, "analysi": [148, 161], "analyt": 142, "analyz": 161, "anderson": [132, 142, 143], "andrea": [156, 169, 175], "andrew": [133, 134, 156, 175], "andrewtanj": 155, "anerrupt": 156, "angl": [127, 129, 131, 132, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 155, 158, 159], "angle_1": 137, "angle_2": 137, "angle_3": 137, "angle_4": 137, "angular": [127, 129, 131, 132, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147], "ani": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 17, 18, 20, 129, 132, 137, 139, 140, 142, 143, 146, 147, 148, 153, 155, 156, 158, 159, 165, 166, 169, 174, 175, 177], "anim": [9, 136], "ankle_1": 137, "ankle_2": 137, "ankle_3": 137, "ankle_4": 137, "annot": [155, 156, 174, 175, 177, 178], "annot_kw": 175, "annoy": 156, "anoth": [14, 15, 17, 137, 140, 141, 143, 147, 154, 155, 163, 166, 174, 177], "ansi": [2, 155, 156, 165], "ansi_list": 2, "answer": [148, 163, 165], "ant": [136, 155, 156, 169], "anymor": [14, 18, 19, 155, 156], "anyth": [148, 169, 175], "anytrad": 148, "anywher": [156, 159], "apach": 148, "apart": 165, "api": [2, 3, 14, 17, 20, 148, 155, 156, 157, 158, 164, 165, 166, 168, 169, 170, 178], "apicompat": 156, "appear": [133, 134, 158], "append": [14, 19, 156, 163, 173, 174, 175, 177, 178], "appli": [2, 4, 8, 9, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 127, 129, 130, 131, 132, 133, 134, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 150, 155, 156, 160, 165, 167, 174, 177], "applic": [5, 7, 146, 148, 158, 159, 170, 172, 173, 176], "apply_along_axi": 174, "apply_api_compat": [4, 155, 156], "apply_env_compat": 156, "appreci": 155, "approach": [142, 155, 156, 160, 165, 173, 174, 177], "appropri": [156, 165, 169, 177], "approxim": [14, 19, 148, 163], "ar": [2, 4, 5, 6, 7, 8, 9, 10, 11, 13, 14, 15, 16, 17, 18, 19, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 126, 127, 128, 129, 130, 131, 132, 133, 134, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 149, 150, 151, 152, 153, 154, 155, 156, 158, 159, 160, 162, 163, 165, 166, 167, 169, 171, 173, 174, 177, 178], "araffin": 155, "arang": [174, 175, 178], "arbitrari": [2, 4, 7, 9, 148, 178], "arbitrarili": 156, "arcad": [17, 148], "archiv": 155, "archiveprefix": 156, "area": 136, "aren": 155, "arg": [9, 11, 12, 159, 163, 174, 177, 178], "argmax": [154, 163, 173, 174, 175], "argument": [4, 5, 6, 7, 8, 9, 10, 11, 12, 14, 16, 126, 130, 149, 155, 156, 158, 165, 169, 174], "ariel": 156, "arjun": [155, 156], "arm": [136, 140, 141, 144, 145, 148], "around": [3, 14, 126, 148, 155, 163], "arr": [163, 174], "arrai": [2, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 16, 17, 18, 20, 129, 131, 132, 133, 134, 135, 155, 156, 158, 159, 160, 163, 165, 167, 173, 174, 177, 178], "arrang": 4, "array_equ": [159, 165], "arrayconvers": [14, 17, 20, 156], "arraytyp": [10, 11, 12, 14], "arrow": [7, 175], "art": 163, "artemmiyi": 156, "articl": 175, "articul": [146, 148], "artifici": 154, "arxiv": [156, 178], "as_cmap": 175, "ascii": [155, 159], "ask": 159, "aspect": [155, 158, 166], "assert": [156, 165], "assess": 2, "asset": [153, 169], "assign": [2, 132, 133, 134, 144, 145, 148, 156, 174, 175], "assist": 148, "associ": [155, 156, 173], "assum": [7, 14, 18, 136, 156, 165], "assumpt": 160, "async": [4, 11, 156], "asynchron": [5, 10, 11, 12, 156], "asyncvectorenv": [10, 156, 162, 178], "atari": [9, 17, 20, 155, 156, 158, 174], "atari_wrapp": 18, "ataripreprocess": [17, 20, 156], "attach": [129, 132, 135, 137, 142, 143, 147], "attempt": [8, 129, 136, 154, 178], "attitud": 148, "attr": 6, "attribut": [4, 6, 11, 12, 17, 18, 19, 156, 158, 165, 167], "attributeerror": 156, "audio": 156, "augment": [18, 20, 158], "author": [133, 134, 155, 156, 169, 174, 175, 177, 178], "auto": [21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 156], "autobuild": 1, "autom": [148, 155], "automat": [1, 2, 4, 10, 11, 12, 14, 17, 18, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 155, 156, 163, 165, 178], "automata": [148, 156], "autoreset": [4, 10, 11, 12, 17, 20, 156], "autoreset_mod": [10, 11, 12, 156], "autoresetmod": [10, 11, 12, 156], "autoresetwrapp": [17, 155, 156], "autorom": [155, 156], "aux_1": 137, "aux_2": 137, "aux_3": 137, "aux_4": 137, "auxiliari": [2, 159, 165], "avail": [4, 10, 129, 148, 150, 151, 152, 155, 156, 159, 160, 161, 165, 169, 171, 173], "averag": [9, 14, 19, 20, 161, 163, 166, 174, 175, 177], "average_reward": 163, "avg_length": 161, "avg_rec": 161, "avg_reward": [161, 177], "aviat": 148, "avoid": [10, 13, 15, 151, 152, 154, 158, 159, 169, 173], "awai": [137, 138, 139, 140, 144, 145, 146, 147, 154, 167, 175], "awak": 129, "awar": [148, 156], "award": 132, "ax": [5, 7, 163, 165, 174, 175, 178], "ax1": 174, "ax2": 174, "axb2035": 156, "axi": [17, 18, 133, 134, 137, 140, 141, 146, 173, 174, 175], "ayesh": 156, "b": [1, 7, 144, 145, 154, 155], "b14c": 169, "b2dtut": 128, "b5": 7, "back": [11, 14, 15, 17, 18, 20, 126, 136, 137, 138, 156, 169], "back_leg": 137, "backend": [155, 156, 165], "background": 128, "backlog": 156, "backport": 155, "backward": [138, 155, 156, 177, 178], "bad": [13, 158, 159, 163], "badia": 178, "balanc": [132, 142, 143, 158, 159, 163, 173, 177, 178], "bali": 156, "balisujohn": [155, 156], "bandit": 148, "bar": [9, 163, 178], "bare": 15, "barto": [2, 131, 132, 142, 143, 150, 151, 152, 155, 174, 175], "base": [2, 4, 5, 9, 10, 13, 14, 15, 17, 18, 19, 20, 126, 131, 133, 134, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 154, 155, 156, 158, 159, 163, 165, 167, 169, 173, 174, 177, 178], "base_env": 15, "base_random_se": 173, "baselin": 148, "baselines3": [18, 171], "basemujocoenv": 156, "bash": 155, "basic": [156, 159, 160, 161, 163, 169, 171], "basicconfig": 161, "basilisk": 148, "batch": [5, 10, 11, 12, 13, 14, 155, 178], "batch_spac": [5, 13, 156], "bbox_inch": 173, "bbox_to_anchor": 174, "beanpow": 156, "beat": [148, 150], "beatabl": 174, "becam": 155, "becaus": [136, 160, 163, 165, 167, 169, 173, 174, 178], "becom": [126, 155, 156, 163, 166, 178], "been": [2, 9, 10, 15, 129, 137, 140, 141, 148, 155, 156, 158, 159, 165, 166, 175, 178], "befor": [2, 4, 9, 10, 14, 15, 16, 17, 18, 19, 20, 128, 137, 138, 139, 140, 144, 145, 146, 147, 155, 156, 158, 160, 163, 165, 167, 169, 177, 178], "began": 156, "begin": [14, 17, 155, 158, 159, 160, 165, 174, 178], "beginn": [156, 159], "behav": [155, 161], "behavior": [14, 15, 135, 136, 137, 138, 139, 140, 141, 146, 147, 148, 155, 156, 158, 159, 160, 161, 163, 165, 167, 169], "behaviour": [129, 136, 156], "behind": [2, 137, 140, 156, 160], "being": [3, 4, 6, 7, 8, 17, 129, 133, 134, 135, 137, 140, 141, 144, 145, 155, 156, 158, 159, 163, 169, 174, 175], "believ": 156, "bellman": 163, "belong": 6, "below": [7, 10, 20, 135, 147, 156, 158, 160, 166, 174, 178], "benchmark": [126, 148], "benchmark_init": 9, "benchmark_rend": 9, "benchmark_step": 9, "benefit": [17, 156, 173], "bennet": 148, "besid": 136, "best": [163, 173, 174, 175, 178], "better": [127, 155, 156, 159, 160, 163, 173, 178], "between": [3, 6, 7, 14, 17, 18, 19, 20, 129, 131, 132, 135, 136, 137, 138, 139, 140, 141, 142, 143, 145, 146, 147, 148, 155, 156, 158, 159, 160, 163, 165, 166, 174, 175, 177, 178], "beyond": 156, "bf1797a3": 169, "bfoot": 138, "bia": [137, 138, 139, 140, 141, 146, 147, 178], "bias": [161, 178], "big": [163, 165, 175], "bigger": 175, "biggest": [160, 175], "bike": [158, 163], "binari": [5, 7, 148, 158, 165, 173], "bind": [126, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 155], "biomechan": 136, "bipe": 136, "biped": [126, 140, 141, 147, 155, 169], "bipedal_walk": 127, "bipedalwalk": [127, 155], "biplan": 148, "bird": 148, "bit": 155, "bitcraz": 148, "bkrl": 155, "black": [131, 155, 156, 174, 175], "blackjack": [149, 155, 156, 170, 176], "blackjack_q_learn": 174, "blackjackag": [163, 174], "blit": 165, "blob": [151, 152, 155, 169], "block": 156, "blog": [155, 156, 160], "blue": [131, 154, 165, 173, 175], "blueski": 148, "board": 148, "board_gam": 155, "bodi": [129, 136, 137, 138, 139, 140, 141, 142, 144, 146, 147, 169], "boilerpl": [15, 158, 165, 167], "bonu": [147, 178], "book": [131, 150, 151, 152, 155, 174], "book_or_nip": 131, "bool": [2, 4, 5, 6, 7, 9, 10, 11, 12, 14, 15, 17, 18, 132, 136, 137, 138, 139, 140, 141, 146, 147, 163, 165, 173, 174, 175, 177], "bool8": 156, "bool_": 156, "boolean": [2, 5, 9, 14, 17, 129, 156, 174, 177], "booster": 129, "bootstrap": [2, 160, 166, 173, 178], "bot": 148, "both": [7, 10, 11, 12, 18, 127, 130, 131, 147, 148, 150, 151, 152, 153, 154, 155, 156, 158, 159, 160, 161, 162, 165, 166, 173, 175, 177], "bother": 165, "bottom": [128, 133, 134, 139, 151, 152, 156, 159, 175], "bound": [2, 7, 14, 16, 17, 18, 19, 20, 129, 131, 132, 133, 134, 135, 155, 156, 158, 159, 166], "boundari": 8, "bounded": 5, "box": [2, 5, 6, 7, 8, 10, 11, 13, 14, 15, 16, 17, 18, 20, 127, 128, 129, 131, 132, 133, 134, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 155, 156, 158, 159, 165, 167], "box2d": [127, 128, 129, 155, 156, 158], "brake": 128, "brax": [148, 156], "break": [155, 156, 160, 163, 175], "bridg": 148, "bring": 156, "britojr": 156, "brittl": 177, "broken": [17, 155], "brown": 156, "browser": 1, "bshin": 138, "bsk": 148, "bsuit": 148, "bthigh": 138, "btjanaka": 156, "buffalo": 148, "buffer": [14, 17, 128], "buffer_length": [14, 17, 161, 163, 174, 178], "bug": [17, 129, 136, 137, 139, 140, 142, 143, 144, 145, 147, 153, 155, 156, 160, 163], "build": [5, 126, 137, 138, 139, 140, 141, 142, 143, 146, 147, 148, 156, 158, 161, 165, 167], "built": [13, 148, 155, 156, 159, 162], "bullet": 148, "bump": 155, "bunch": 175, "burden": 177, "bushi": 9, "busi": 158, "bust": [150, 163, 174], "button": [5, 7, 9, 158], "c": [9, 129, 131, 156, 165, 177], "cab": 154, "calcul": [14, 18, 19, 135, 137, 142, 151, 152, 153, 154, 159, 161, 169, 173, 178], "call": [2, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 137, 144, 145, 150, 153, 155, 156, 158, 159, 160, 163, 165, 169, 174, 178], "call_async": 156, "call_wait": 156, "callabl": [3, 4, 9, 11, 12, 13, 14, 16, 17, 18, 19, 156], "callback": [9, 155], "cambridg": [133, 134], "camera": [136, 137, 138, 139, 140, 146, 147], "camera_id": 136, "camera_nam": 136, "campbel": 128, "can": [1, 2, 4, 5, 6, 7, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 126, 128, 129, 130, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 150, 151, 152, 153, 154, 155, 156, 157, 158, 159, 160, 161, 162, 163, 165, 167, 169, 173, 175, 177, 178], "cannot": [4, 8, 13, 17, 148, 151, 152, 155, 156, 165, 166, 171], "canva": 165, "capabl": [155, 157, 161], "capped_cubic_video_schedul": [9, 17], "captur": [9, 17], "car": [126, 130, 148, 155, 158], "car_rac": [128, 155, 158], "card": [150, 163, 174], "cardin": 159, "care": [5, 148, 163], "carl": 148, "carlo": [163, 174, 177, 178], "carloslui": 155, "carrac": [9, 14, 18, 128, 155, 156, 158], "cart": [130, 142, 143, 158, 177], "cart_posit": 158, "cart_veloc": 158, "cartesian": [6, 7, 135], "cartpol": [2, 9, 10, 14, 16, 17, 18, 19, 130, 132, 136, 142, 143, 148, 155, 156, 158, 160, 161, 163, 171, 177], "cartpoleenv": [17, 132, 156], "cartpolejax": 17, "cartpolevectorenv": [132, 156], "casadi": 148, "case": [2, 3, 5, 6, 7, 13, 14, 16, 128, 137, 138, 139, 140, 141, 146, 147, 154, 156, 158, 159, 160, 165, 166, 167, 169, 177, 178], "casino": [163, 174], "cast": 18, "cat": 138, "catch": [156, 159, 161], "categor": [7, 178], "categori": 1, "caught": 155, "caus": [140, 147, 154, 155, 156, 162, 163], "cbar": 174, "cc": 131, "cclauss": 155, "ccmdp": 148, "cd": 1, "cell": [148, 151, 152, 159, 165], "cellular": [148, 156], "center": [14, 18, 20, 128, 129, 132, 135, 137, 140, 141], "centr": [137, 140, 141], "central": 156, "centric": 177, "certain": [2, 143, 145, 155, 156, 174, 178], "cfrc_ext": [137, 140, 141], "chain": [15, 131, 146, 158], "challeng": [148, 163, 174], "chanc": [11, 148, 154], "chandrasekar": 177, "chang": [1, 2, 3, 9, 11, 12, 13, 14, 15, 16, 17, 18, 19, 128, 129, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 143, 146, 147, 148, 154, 155, 156, 158, 159, 162, 165, 167, 169, 174, 177], "changelog": [4, 155, 156], "channel": [14, 17, 18], "charact": [7, 9], "character": 148, "charg": [6, 148], "charlist": 7, "charraut": 156, "charset": 7, "cheat": 163, "check": [1, 2, 5, 7, 15, 17, 20, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 154, 155, 156, 158, 160, 163, 165, 167, 169, 174, 175], "check_env": [9, 156, 159, 160], "check_environments_match": 156, "checker": [4, 20, 155, 156], "cheetah": 136, "chess": 158, "child": 13, "children": 11, "choic": [158, 159, 173, 175, 177, 178], "choos": [158, 163, 165, 169, 173, 175], "choose_act": 175, "chosen": [2, 7, 151, 152, 175, 178], "chri": 128, "christofkaufmann": 156, "chrisyeh96": 156, "chunk": 17, "ci": [9, 155, 156], "cinert": [140, 141], "circl": 165, "citat": 156, "cite": 156, "civil": 148, "clamp": [140, 141], "clarifi": [155, 156], "clariti": 159, "class": [2, 3, 4, 5, 6, 7, 9, 10, 11, 12, 14, 15, 17, 18, 19, 136, 148, 155, 156, 158, 159, 162, 163, 165, 167, 169, 174, 175, 177, 178], "classic": [129, 131, 132, 133, 134, 135, 139, 143, 146, 147, 148, 155, 156, 158, 166, 173], "classic_control": [17, 155], "classif": 148, "classmethod": 15, "clean": [2, 148], "cleaner": [154, 160], "cleanup": 155, "clear": [13, 17, 156, 158, 159, 160, 161, 163], "clear_mpi_env_var": 13, "clearer": [2, 155, 161], "clearli": 5, "clementperroud": 156, "cliff": [149, 156], "cliff_walk": [151, 152], "cliffwalk": [151, 152, 155, 156], "cliffwalkingslipperi": 152, "climb": 130, "clip": [14, 16, 19, 20, 133, 134, 137, 156, 158, 159, 165, 167, 178], "clip_reward": 165, "clipact": [14, 16, 20, 158], "clipreward": [10, 14, 19, 20, 156, 167], "clobber": 155, "clock": [161, 165], "clockwis": 135, "clone": [148, 169], "close": [2, 3, 7, 9, 10, 11, 12, 14, 15, 17, 19, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 136, 137, 139, 140, 145, 147, 155, 156, 157, 158, 160, 161, 167, 169, 173, 174, 175, 178], "close_extra": [10, 11, 12], "closechoic": 156, "closer": [129, 150, 156, 163], "closest": 127, "cloudpickl": 13, "cloudpicklewrapp": 13, "cluster": 148, "cmap": [174, 175], "cnt": 156, "co": [131, 133, 134, 135, 142, 145, 148], "coars": 131, "code": [2, 3, 5, 6, 9, 11, 14, 15, 17, 18, 19, 131, 148, 155, 156, 161, 162, 165, 167, 169, 170, 173, 174, 175, 177, 178], "codebas": [156, 160, 165], "coeffici": [146, 178], "coin": 7, "coincid": 165, "col": [151, 152, 153], "cola": 156, "colder": 155, "collabor": 161, "collect": [2, 10, 11, 12, 17, 20, 148, 156, 157, 161, 163, 169, 174, 178], "collector": 156, "collid": 129, "collis": [133, 134, 148, 155], "color": [2, 6, 154, 173], "color_palett": 175, "colour": [128, 155], "column": [4, 163, 175, 177], "com": [19, 140, 141, 151, 152, 153, 155, 165, 169, 171, 175, 177], "combin": [2, 5, 9, 15, 145, 158, 159, 178], "come": [129, 137, 138, 139, 140, 146, 147, 156], "comet": 156, "command": [136, 165], "comment": [136, 155, 156, 178], "commit": [156, 165], "common": [7, 15, 18, 20, 156, 160, 161, 166, 167, 170, 172, 176, 177], "commonli": [20, 155], "commonroad": 148, "commun": [11, 155, 160, 161], "compar": [139, 140, 146, 147, 148, 160, 161, 173, 174, 175, 178], "comparison": [161, 173], "compartment": 156, "compat": [14, 17, 18, 20, 144, 148, 155, 156, 165, 166, 167, 169, 173, 174, 175, 177, 178], "compet": 161, "compil": [148, 155, 162], "compilergym": 148, "complement": 2, "complet": [1, 4, 11, 17, 128, 129, 156, 158, 159, 161, 163, 166, 167, 174], "complex": [5, 6, 136, 140, 141, 142, 143, 148, 156, 158, 160, 161, 162, 177, 178], "compli": 155, "complianc": 155, "compliant": 155, "complic": [7, 15, 160, 167], "compon": [18, 158, 159, 160, 165], "compos": [9, 137, 138, 139, 140, 141, 143, 146, 147], "composit": 7, "compound": 8, "comprehens": [148, 155], "compris": 7, "comput": [2, 3, 9, 14, 18, 19, 20, 136, 137, 155, 156, 159, 161, 163, 165, 173, 174, 177, 178], "computation": [148, 162], "compute_metr": 9, "concat": 175, "concaten": [5, 8, 11, 12, 13, 136, 156], "conceptu": [7, 160, 163], "concern": 177, "conda": [156, 165], "condit": [2, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 166, 169, 174, 177], "conduct": 156, "confid": 161, "config": 4, "configur": [126, 130, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 149, 159, 160, 161, 165, 174, 178], "confirm": [131, 155], "conflict": 9, "congratul": [159, 163], "conjunct": [9, 13], "connect": [2, 6, 11, 131, 137, 138, 139, 140, 141, 145, 146, 147, 148], "connectionist": 177, "consecut": 129, "consequ": [155, 158, 163], "consid": [4, 128, 129, 130, 136, 137, 139, 140, 143, 147, 165, 167, 173], "consist": [3, 7, 127, 129, 131, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 150, 155, 156, 158, 159, 160, 161, 162, 163, 165, 167, 169, 173, 174, 177], "consol": [4, 161], "consolid": 155, "constant": [3, 129, 134, 137, 140, 141, 142, 163], "constantli": 145, "constitu": 6, "constrain": [148, 173], "constraint": [140, 141, 142, 148, 159, 160], "construct": [7, 9, 131, 137, 138, 139, 140, 141, 146, 147, 148], "constructor": [4, 9, 15, 155, 156, 158, 165], "consult": 169, "consumpt": 2, "contact": [127, 129, 136, 137, 140, 141, 142, 155], "contact_cost": [137, 140], "contact_cost_rang": 140, "contact_cost_weight": [137, 140, 169], "contact_force_rang": 137, "contain": [1, 2, 5, 8, 10, 13, 17, 18, 127, 128, 129, 131, 132, 133, 134, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 150, 151, 152, 153, 154, 155, 156, 158, 159, 165, 169, 171, 174, 177, 178], "content": 161, "context": [4, 11, 13, 148, 177], "contextu": 148, "continu": [2, 5, 9, 14, 18, 19, 128, 129, 130, 133, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 155, 158, 159, 166, 174, 177, 178], "continuous_mountaincarenv": 134, "contribut": [126, 148, 156, 171], "contributor": 156, "control": [2, 5, 7, 126, 128, 131, 132, 133, 134, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 155, 156, 158, 159, 163, 167, 169, 175, 178], "conveni": [6, 15, 158, 159, 165], "convent": [1, 2], "converg": [163, 173, 174, 175], "convers": [3, 148, 156], "convert": [1, 5, 6, 14, 17, 18, 20, 129, 148, 155, 156, 159, 160, 174, 175], "convert_to_done_step_api": [9, 160], "convert_to_terminated_truncated_step_api": [9, 160], "convolution_mod": 163, "convolv": [156, 163, 174, 178], "cool": 156, "coordin": [7, 14, 127, 129, 135, 137, 138, 139, 140, 141, 144, 145, 146, 147, 148, 159], "coordinatesof": 142, "copi": [10, 11, 12, 13, 159, 165], "copier": 165, "core": [155, 156, 158, 159, 163], "correct": [4, 9, 10, 16, 129, 148, 154, 155, 156, 158, 160, 163, 165, 166, 177], "correctli": [2, 9, 14, 18, 19, 155, 156, 165, 166], "correspond": [1, 2, 4, 7, 11, 12, 15, 18, 129, 131, 132, 133, 134, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 150, 154, 165, 175, 177, 178], "correspondingli": 128, "cosin": [131, 142, 145], "cost": [127, 156], "could": [2, 9, 14, 137, 138, 139, 140, 141, 143, 146, 147, 156, 158, 159, 160, 163, 165, 166, 167, 169, 173, 174, 175, 177, 178], "couldn": 160, "coulom": 146, "count": [7, 127, 129, 150, 163, 174], "counter": [135, 156], "coupl": 178, "cours": [148, 175], "cover": [5, 12, 174], "coverag": 148, "cpu": [129, 136, 162, 178], "craft": 129, "craftium": 148, "crash": [129, 158], "crazyfli": 148, "creat": [4, 5, 7, 9, 10, 11, 12, 13, 14, 15, 17, 127, 128, 129, 145, 148, 155, 156, 158, 160, 161, 162, 163, 167, 169, 173, 174, 177, 178], "create_empty_arrai": [5, 13, 156], "create_grid": 174, "create_plot": 174, "create_se": 155, "create_shared_memori": [5, 13], "creation": [2, 4, 156, 160, 165], "creatur": 148, "criteria": [158, 159], "critic": [2, 17, 156], "critic_lay": 178, "critic_loss": 178, "critic_losses_moving_averag": 178, "critic_lr": 178, "critic_optim": 178, "critic_weight": 178, "critic_weights_path": 178, "cross": [151, 152, 153], "crucial": [5, 10, 158, 159, 160], "crypto": 148, "cstride": 174, "ctr_cost": 147, "ctrl_cost": [137, 138, 139, 140, 146, 147], "ctrl_cost_weight": [137, 138, 139, 140, 141, 146, 147, 169], "ctx": 13, "cube": 5, "cuda": [148, 178], "cum_reward": 175, "cumsum": 175, "cumul": [9, 14, 17, 20, 175], "cumulative_reward": 9, "cupi": [14, 17], "current": [2, 4, 7, 9, 10, 17, 18, 128, 148, 150, 151, 152, 153, 154, 155, 156, 158, 159, 162, 163, 165, 173, 174, 175, 177, 178], "current_col": [151, 152, 153], "current_namespac": 4, "current_q": 163, "current_row": [151, 152, 153], "curriculum": 155, "curv": [155, 161, 173], "custom": [2, 5, 10, 11, 12, 14, 15, 17, 18, 132, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 153, 155, 156, 158, 161, 163, 168, 170], "customis": 148, "customiz": 148, "customspaceerror": 13, "cut": [160, 163], "cvel": [140, 141], "cyaneu": 153, "cylind": 144, "cython": 156, "d": [7, 9, 15, 131, 148, 159, 171, 178], "dac": 148, "dacbench": [148, 156], "daemon": 11, "dag": 148, "dai": 126, "danger": 173, "darkgrid": 177, "data": [5, 8, 9, 10, 15, 148, 155, 156, 158, 159, 161, 162, 163, 165, 167, 174, 175, 177, 178], "data_equival": 156, "data_equivil": 156, "databas": 2, "datafram": [175, 177], "datapoint": 8, "dataset": 156, "datatyp": 155, "david": 175, "davidpl1": 156, "davidslayback": 156, "de": 156, "dead": [155, 156], "deal": [6, 178], "dealer": [150, 155, 163, 174], "dealer_card": 163, "dealer_count": 174, "debug": [2, 5, 9, 148, 149, 155, 156, 158, 160, 161, 163], "decai": [163, 174], "decay_epsilon": [163, 174], "decent": [174, 177], "decid": [150, 156, 175], "decis": [148, 155, 156, 158, 159, 163, 166], "deck": [150, 163, 174], "declar": 159, "decomposit": 154, "decreas": [129, 162, 163, 175], "deep": [148, 155, 162, 166, 171, 175, 177, 178], "deepmind": [136, 155, 169], "def": [9, 14, 156, 159, 163, 165, 167, 169, 173, 174, 175, 177, 178], "default": [2, 4, 5, 6, 7, 9, 10, 11, 12, 13, 14, 15, 17, 18, 19, 128, 129, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 151, 152, 155, 156, 158, 159, 165, 166, 169], "default_camera_config": [136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147], "default_rng": 175, "defaultdict": [163, 174], "defin": [2, 3, 5, 8, 11, 12, 14, 15, 16, 17, 18, 135, 155, 156, 158, 159, 165, 166, 167, 175, 178], "definit": [137, 139, 140, 142, 155, 156, 166], "deform": 148, "deformable_gym": 148, "degre": [11, 140, 141, 142, 167, 178], "delai": [18, 20, 156, 165], "delayobserv": [18, 20, 156], "deleu": 156, "deliv": 154, "delta": [175, 177], "demand": 128, "demo": 1, "demonstr": [14, 127, 148, 161, 169, 173, 178], "dennybritz": [151, 152], "denot": [2, 132, 153], "densiti": [144, 148, 156], "depend": [2, 6, 9, 10, 14, 18, 19, 126, 129, 130, 132, 136, 137, 138, 139, 140, 141, 146, 147, 153, 155, 156, 165, 175, 178], "dependencynotinstal": [9, 17], "deprec": [2, 136, 155, 156], "depreci": 155, "depth": 156, "depth_arrai": 136, "deque_s": [14, 17], "deriv": [137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 177], "derk": 148, "desc": [153, 175], "describ": [2, 5, 6, 7, 131, 132, 146, 150, 155, 156, 158, 167], "descript": [6, 20, 136, 156, 165], "design": [131, 140, 141, 148, 149, 154, 156, 163], "desir": [9, 14, 154, 159, 169, 178], "despit": 156, "destin": [154, 173], "destroi": [129, 156], "detach": 178, "detail": [5, 6, 7, 9, 19, 131, 148, 155, 156, 158, 159, 161, 163, 165, 169, 173, 178], "detect": [156, 160, 165], "determin": [2, 17, 129, 131, 132, 133, 134, 135, 153, 155, 156, 158, 159, 165, 166, 169], "determinist": [16, 129, 131, 133, 134, 165, 178], "dev": [2, 155, 177], "develop": [136, 148, 155, 156, 160, 161, 163, 171, 177], "deviat": [146, 163, 177, 178], "devic": [14, 17, 156, 178], "devicearrai": 17, "dexter": 148, "dexteroushand": 148, "df1": 177, "di": 160, "diagnost": 2, "diagon": 159, "diagram": 135, "dict": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 18, 20, 136, 151, 152, 153, 154, 155, 156, 158, 159, 160, 165, 173, 177], "dict_info": 14, "dict_kei": 18, "dict_time_kei": 18, "dictat": [128, 129], "dictinfotolist": [10, 14, 20, 156], "dictionari": [2, 5, 6, 7, 9, 10, 14, 18, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 155, 156, 158, 159, 165, 167, 173, 174, 177], "did": [156, 166], "didn": [156, 175], "die": 128, "dietterich": 154, "differ": [2, 5, 6, 9, 11, 12, 16, 17, 18, 128, 135, 136, 147, 148, 155, 156, 158, 159, 160, 161, 163, 165, 166, 167, 169, 170, 172, 173, 175, 176, 178], "differenti": 166, "difficult": [132, 136, 142, 143, 156, 159, 160, 162, 163, 175], "difficulti": [155, 159], "digit": 7, "dim": [140, 141], "dimens": [5, 7, 8, 18, 148, 156, 177], "dimension": [5, 17, 129, 137, 138, 139, 146, 147, 156, 158, 159, 165, 178], "direct": [6, 131, 132, 133, 134, 137, 138, 139, 140, 142, 143, 146, 147, 148, 151, 152, 153, 154, 159, 163, 165, 175, 177], "directli": [2, 6, 10, 15, 17, 131, 136, 158, 159, 165, 174, 177], "directori": [1, 155, 165], "dirhtml": 1, "disabl": [4, 17, 18, 19, 151, 152, 153, 155, 156, 163, 169], "disable_env_check": [4, 16, 17, 155], "disable_logg": 17, "disable_print": 4, "disable_render_order_enforc": [17, 155], "disallow": 154, "disc_to_cont": 167, "discard": 18, "discord": [148, 155, 156, 160, 171], "discount": [14, 19, 160, 163, 166, 174, 175, 177, 178], "discount_factor": [163, 173, 174], "discourag": 155, "discov": [156, 169], "discret": [2, 5, 6, 7, 8, 11, 13, 18, 128, 129, 131, 132, 133, 134, 148, 149, 150, 151, 152, 153, 154, 155, 156, 158, 159, 163, 165, 167, 174], "discrete_act": 165, "discreteact": 167, "discreteenv": 155, "discuss": [155, 156, 159], "displac": [137, 138, 139, 140, 146, 147], "displai": [2, 4, 132, 155, 160, 165], "dissect": 175, "dist": 144, "distanc": [138, 139, 141, 144, 147, 159, 165], "distance_from_origin": [137, 140], "distance_penalti": 142, "distinct": [160, 166], "distinguish": [2, 159, 160, 165, 166], "distrib": 177, "distribut": [5, 6, 7, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 153, 155, 156, 169, 175, 177, 178], "dive": 158, "divers": [148, 157], "dlpack": 156, "do": [4, 7, 13, 15, 17, 128, 129, 131, 155, 156, 158, 159, 161, 163, 165, 167, 169, 175, 177, 178], "doc": [9, 129, 155, 156, 167], "dockerfil": 155, "docstr": [1, 155, 156], "doctest": 156, "document": [5, 7, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 126, 130, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 149, 155, 156, 158, 160, 165, 169, 174, 178], "doe": [2, 6, 8, 9, 10, 11, 12, 13, 15, 17, 18, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 150, 155, 156, 159, 165, 166, 167, 178], "doesn": [1, 2, 4, 15, 17, 129, 155, 156, 159, 166, 175], "dof": [137, 140, 141], "dog": 9, "doi": [154, 156], "domain": [16, 128, 131, 133, 134, 154, 167], "domain_random": 128, "don": [6, 14, 15, 128, 133, 155, 156, 158, 159, 160, 165, 166, 173, 175, 178], "done": [2, 9, 14, 155, 156, 158, 163, 165, 166, 169, 173, 174, 175, 177, 178], "doom": 148, "dot": [6, 7, 165], "doubl": 136, "doublependulum": 142, "down": [5, 7, 128, 141, 148, 150, 151, 152, 153, 154, 156, 159, 163, 165, 166, 173, 174, 175], "download": [165, 166, 167, 170, 173, 174, 175, 177, 178], "downward": 131, "dpi": 173, "dramat": [155, 156], "draw": [6, 150, 163, 165, 174], "drawn": [6, 7, 144, 146, 150, 163], "drive": [128, 173], "driver": 156, "drone": 148, "drop": [154, 156, 173], "drryanhuang": 156, "dry": 159, "dsctt": 155, "dstack": 174, "dt": [137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 156, 169], "dtype": [2, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 16, 17, 18, 20, 129, 131, 132, 133, 134, 135, 155, 156, 159, 165, 175], "dtypeobserv": [14, 18, 20, 156], "dual": 148, "duburcqa": [155, 156], "duckietown": 148, "due": [2, 129, 132, 136, 153, 155, 156, 158, 160, 163, 166, 178], "dump": 156, "dunbar": 156, "dunder": 156, "duplic": [14, 156], "durat": [9, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 155, 161, 177], "dure": [2, 4, 6, 7, 10, 14, 17, 18, 19, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 154, 155, 156, 160, 165, 167, 169, 173], "dw": 9, "dx": [137, 138, 139, 140, 146, 147], "dylwil3": 156, "dynam": [2, 16, 131, 135, 136, 142, 148, 155, 156, 159, 160], "e": [1, 2, 4, 5, 7, 8, 9, 11, 13, 14, 15, 17, 20, 129, 137, 138, 139, 140, 141, 143, 144, 145, 146, 147, 148, 150, 153, 155, 156, 159, 165, 167, 174, 175, 177, 178], "e3c16072f695": 169, "each": [2, 5, 6, 7, 9, 10, 11, 12, 13, 14, 16, 17, 18, 20, 126, 127, 128, 129, 130, 131, 132, 133, 134, 136, 137, 140, 141, 142, 143, 144, 145, 148, 149, 151, 152, 154, 155, 156, 158, 159, 160, 161, 163, 165, 173, 174, 175, 178], "earli": [126, 161, 163, 174, 177], "earlier": [137, 140, 141, 165], "earliest": 177, "easi": [148, 149, 155, 158, 159, 175], "easier": [130, 155, 156, 158, 159, 178], "easiest": [128, 155, 156], "easili": [6, 10, 15, 148, 155, 156, 162], "east": [154, 173], "ed": 131, "edg": [5, 6, 8, 132, 155, 156, 158, 159, 163], "edge_link": [6, 8], "edge_mask": 6, "edge_spac": [6, 8], "edgecolor": 174, "edit": [148, 155, 165], "educ": 161, "effect": [2, 8, 13, 15, 17, 129, 137, 141, 142, 143, 144, 145, 146, 154, 158, 159, 161, 173, 174, 177], "effector": [144, 145], "effici": [11, 133, 134, 136, 148, 156, 159, 161, 162, 173, 178], "effort": [130, 156], "eg": 165, "egl": 136, "eight": 137, "einforc": 177, "either": [7, 8, 9, 12, 14, 16, 17, 133, 134, 148, 150, 153, 154, 156, 158, 160, 175, 177, 178], "ekalosak": [155, 156], "elaps": [14, 17], "elbow": 144, "electron": 148, "element": [2, 5, 6, 7, 10, 11, 13, 18, 132, 133, 134, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 156, 158, 165, 169, 177, 178], "elev": 169, "eleven": 136, "elf": 153, "elif": [159, 160], "elimin": 173, "elliottow": 156, "elo": 148, "els": [14, 18, 139, 147, 153, 154, 156, 159, 163, 165, 173, 174, 175, 178], "emb": 169, "embed": [161, 169], "emerg": [156, 161], "emit": 2, "emphas": 159, "emploi": 17, "empti": [5, 7, 13, 17, 137, 138, 139, 140, 141, 146, 147, 156, 159, 174, 175, 177], "emul": [155, 160], "en": [18, 177], "enabl": [4, 9, 17, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 128, 148, 155, 156, 160], "enable_wind": [129, 178], "encapsul": 2, "encod": [8, 148, 154, 155, 165], "encompass": 148, "encount": [160, 163, 178], "encourag": [155, 159, 169, 178], "end": [2, 3, 10, 14, 17, 127, 135, 136, 155, 156, 157, 158, 159, 160, 161, 163, 166, 169, 174, 175, 177, 178], "endeavor": 148, "energi": [127, 129, 132, 159, 167], "enforc": [4, 17, 155], "engin": [129, 136, 148, 156], "english": 7, "enough": [159, 169, 178], "ensur": [1, 2, 4, 6, 8, 9, 129, 148, 156, 158, 159, 161, 163, 165, 173, 174], "ent_coef": 178, "enter": [2, 9, 129, 151, 152], "entir": [9, 17, 139, 147, 155, 156, 178], "entiti": 5, "entrain": 148, "entri": [4, 155, 156, 159, 163], "entropi": [2, 178], "entropy_moving_averag": 178, "entry_point": [4, 155, 159, 165], "entrypoint": 165, "enum": [4, 10, 156, 165], "enumer": [173, 175], "env": [4, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 127, 128, 129, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 151, 152, 153, 154, 155, 156, 157, 158, 159, 160, 161, 163, 166, 167, 169, 170, 173, 174, 175, 176, 177], "env_check": [9, 155, 156, 159], "env_devic": [14, 17], "env_fn": [11, 12], "env_id": [4, 156, 160], "env_lambda": 9, "env_mask": 173, "env_nam": [4, 161], "env_new": 9, "env_old": 9, "env_spec": 156, "env_spec_kwarg": 156, "env_typ": 1, "env_unmask": 173, "env_xp": [14, 17], "envapicompat": 155, "envcompat": 155, "envcreat": 4, "environ": [4, 5, 7, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 126, 127, 128, 129, 130, 131, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 149, 150, 151, 152, 153, 154, 155, 156, 157, 161, 166, 167, 168, 170, 171, 172, 176, 177], "environment_cr": 165, "environmentnam": 156, "envpool": [155, 156], "envs_wrapp": 178, "envspec": [2, 3, 4, 10, 15, 17, 156], "ep": [175, 177], "ep_action_log_prob": 178, "ep_reward": 178, "ep_value_pr": 178, "episod": [2, 4, 9, 10, 14, 17, 18, 20, 155, 156, 157, 158, 159, 160, 163, 165, 166, 169, 173, 174, 175, 177, 178], "episode_data": 161, "episode_id": 9, "episode_index": 9, "episode_num": 161, "episode_ov": [158, 161], "episode_returns_moving_averag": 178, "episode_reward": [14, 19, 161, 163, 173], "episode_tim": 161, "episode_trigg": [9, 17, 161], "episodestatisticsrecord": 156, "epoch": 178, "eprint": 156, "epsilon": [14, 18, 19, 163, 173, 174, 175], "epsilon_decai": [163, 174], "epsilongreedi": 175, "equal": [11, 12, 129, 133, 134, 139, 144, 147, 150, 153, 154, 163, 175], "equat": [131, 135, 163], "equival": [4, 5, 8, 10, 14, 137, 140, 155, 156, 178], "erez": [139, 140, 141], "ericonaldo": 155, "error": [2, 4, 7, 8, 9, 11, 17, 20, 155, 156, 158, 163, 166, 174, 178], "errorr": 155, "escap": 2, "especi": [5, 160, 165, 167, 178], "essenti": [7, 161, 169], "estim": [19, 137, 160, 163, 166, 177, 178], "estimate_valu": 160, "et": [16, 17], "etc": [2, 5, 10, 14, 17, 137, 138, 139, 140, 146, 147, 155, 156, 158, 159, 160, 161, 165, 166, 167], "euclidean": [144, 145], "ev": 148, "ev2gym": 148, "eval": [161, 178], "eval_env": 160, "evalu": [14, 17, 18, 19, 148, 156, 160, 169, 174], "evanmath": 155, "even": [2, 4, 137, 139, 140, 142, 143, 147, 155, 159, 163, 165, 174], "event": [9, 155, 165], "eventu": [13, 158], "ever": [126, 155], "everi": [1, 5, 6, 9, 14, 17, 18, 19, 128, 129, 132, 137, 139, 140, 142, 143, 147, 156, 158, 159, 160, 165, 173, 177, 178], "everyon": 136, "everyth": [17, 148, 158, 159], "evolv": 9, "exact": [150, 156, 174], "exactli": [8, 146, 158, 159, 161], "exampl": [1, 2, 6, 7, 8, 9, 10, 11, 12, 13, 14, 16, 17, 18, 19, 128, 131, 136, 148, 150, 151, 152, 153, 155, 156, 158, 161, 163, 165, 166, 167, 169, 170, 172, 173, 174, 176, 178], "examplefuncenv": 156, "exce": [127, 150], "exceed": [2, 17, 20, 158, 174], "excel": 169, "except": [2, 7, 15, 155, 156, 159, 165], "exchang": 158, "excit": 156, "exclud": [4, 17, 20, 137, 138, 139, 140, 141, 142, 145, 146, 147, 154], "exclude_current_positions_from_observ": [137, 138, 139, 140, 141, 146, 147, 169], "exclude_namespac": 4, "exclus": [6, 136, 140, 141, 156], "execut": [1, 9, 16, 154, 158, 159, 165, 177, 178], "exhibit": 136, "exist": [2, 4, 5, 10, 11, 12, 15, 16, 17, 18, 19, 137, 138, 139, 140, 141, 143, 146, 147, 155, 156, 158, 161, 162, 178], "exist_ok": 173, "exit": [9, 10, 11, 12], "exp": 177, "expand": [5, 7], "expect": [2, 4, 5, 6, 7, 155, 156, 158, 159, 169, 175, 177, 178], "expens": [5, 155], "experi": [17, 136, 137, 140, 141, 142, 143, 148, 158, 159, 163, 174, 175, 177, 178], "experienc": 163, "experiment": [3, 131, 156], "explain": [155, 166], "explan": [174, 177], "explanatori": 174, "explicit": [156, 160], "explicitli": [3, 165, 166, 169], "exploit": [173, 174, 175], "explor": [2, 5, 148, 156, 159, 162, 173, 174, 175, 178], "explor_exploit_tradeoff": 175, "exponenti": [7, 14, 19, 20], "export": 156, "expos": [3, 148, 156], "express": [5, 9, 137, 140, 141], "ext_control": 6, "extend": [2, 17, 137, 156], "extens": [148, 156, 177], "extent": 153, "extern": [2, 137, 140, 141, 155, 156, 160, 166], "extra": [155, 156, 158, 165, 174], "extract": [9, 156, 175], "extrem": [148, 149], "ez": 155, "ezpickl": [4, 9, 15], "f": [153, 158, 159, 161, 163, 173, 174, 175, 177, 178], "f_": [137, 140, 141], "face": [137, 140, 141, 150, 163, 174], "facecolor": 174, "facedown": 150, "facilit": 136, "fact": 177, "factor": [14, 19, 129, 174, 177, 178], "factori": 4, "fail": [156, 158, 160], "failur": [158, 159, 160, 161, 166], "fair": 7, "fairli": [155, 156, 177], "fall": [127, 140, 151, 152, 153, 158, 163, 166, 169, 175], "fallen": [139, 169], "fals": [4, 6, 9, 10, 11, 12, 14, 16, 17, 18, 19, 128, 129, 132, 137, 138, 139, 140, 141, 146, 147, 150, 154, 155, 156, 158, 159, 160, 161, 163, 165, 169, 173, 174, 175, 177, 178], "familiar": 169, "familiaris": 159, "famou": 163, "far": [127, 128, 141, 142, 144, 145, 153, 158], "farama": [10, 11, 12, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 148, 156, 165, 171, 174, 177, 178], "fast": [128, 136, 138, 140, 142, 146, 148, 158, 160, 163], "faster": [127, 129, 137, 140, 141, 142, 145, 156, 163, 173, 178], "fastest": 158, "favor": [2, 155, 156], "favorit": 174, "favour": [2, 155, 156], "featur": [6, 7, 18, 136, 155, 156, 160, 178], "feature_spac": 6, "fed": 178, "feed": 178, "feedback": [156, 158, 159, 163], "feel": [169, 177], "feet": [138, 147], "fetchreach": 160, "few": [1, 131, 137, 138, 139, 140, 141, 143, 146, 147, 155, 156, 163, 169, 174, 175], "ffffffff": 153, "fffffhff": 153, "fffh": 153, "fffhffff": 153, "fffhfffg": 153, "ffoot": 138, "ffset": 177, "fhffhfhf": 153, "fhfh": 153, "fhhfffhf": 153, "fibonacci": 177, "fickl": [154, 156], "fickle_passeng": 154, "fidel": 148, "field": [156, 162], "fieteo": 155, "fig": [163, 174, 175, 178], "fig1": 174, "fig2": 174, "figaspect": 174, "fight": 148, "figsiz": [161, 163, 173, 174, 175, 177, 178], "figur": [139, 156, 161, 173, 174, 177], "file": [1, 131, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 155, 156, 161, 165, 169], "filenam": [9, 17, 161], "fill": 165, "filter": [14, 18, 20, 158, 173], "filter_kei": [14, 18], "filterobserv": [14, 18, 20], "filterobservationwrapp": 18, "final": [3, 9, 18, 155, 156, 159, 161, 163, 165, 166, 169, 174], "final_epsilon": [163, 174], "final_info": [14, 17, 155, 156], "final_observ": [14, 17, 155, 156], "find": [2, 4, 156, 158, 161, 162, 163, 165, 169, 175], "find_highest_vers": 4, "fine": [165, 178], "finetun": 148, "finfo": 175, "fingertip": [144, 145], "finish": [2, 128, 129, 155, 156, 158, 161, 163, 165, 178], "finit": [6, 7, 137, 143, 147, 166, 167, 177], "fire": 129, "firefoxmetzg": 155, "firmwar": 148, "first": [2, 4, 6, 9, 10, 11, 12, 15, 129, 131, 133, 134, 137, 138, 139, 140, 141, 142, 145, 146, 147, 151, 152, 154, 155, 156, 157, 159, 160, 161, 163, 165, 174, 175, 177], "five": [130, 155, 163, 177], "fix": [5, 6, 7, 14, 17, 19, 20, 129, 131, 132, 135, 136, 137, 138, 139, 140, 142, 143, 144, 145, 147, 148, 150, 153, 155, 156, 158, 159, 160, 165, 177], "fixtur": 145, "flag": [11, 133, 136, 148, 160], "flake8": [155, 156], "flappi": 148, "flat": [5, 6, 7, 8, 169], "flatdim": [5, 8, 155], "flatt": 178, "flatten": [5, 8, 14, 18, 20, 136, 155, 156, 158, 159, 163, 165, 174, 175, 178], "flatten_spac": [5, 8], "flattenobserv": [6, 14, 18, 20, 158, 159, 165], "flesh": 3, "flex": 144, "flexibl": [11, 148, 156, 159], "flight": 148, "float": [4, 7, 8, 9, 14, 16, 17, 18, 19, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 159, 163, 165, 173, 174, 175, 177, 178], "float32": [2, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 18, 127, 128, 129, 131, 132, 133, 134, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 156, 167], "float64": [5, 7, 8, 10, 14, 18, 19, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147], "flow": 148, "fluctuat": 163, "fluid": 146, "fly": [129, 160], "flycraft": 148, "fmt": 175, "fn": 13, "focu": [148, 159, 161, 178], "focus": [163, 171, 173], "foddi": 148, "folder": [1, 9, 17, 156, 161], "follow": [1, 3, 4, 5, 9, 10, 14, 16, 17, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 129, 131, 132, 133, 134, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 150, 151, 152, 153, 154, 155, 156, 159, 165, 166, 167, 169, 174, 175, 177, 178], "fontsiz": [174, 175], "foot": [11, 138, 139, 140, 141, 147], "foot_joint": [139, 147], "foot_left_joint": 147, "forc": [15, 129, 132, 133, 134, 136, 137, 140, 141, 142, 143, 147, 155, 169, 177], "forcibli": 166, "forearm": [140, 141, 144], "forev": 166, "foreverska": 156, "forex": 148, "forg": 165, "forget": [14, 15, 158, 165], "forgot": 159, "fork": [1, 156, 157, 160], "form": [5, 6, 7, 17, 131, 146, 156, 165], "formal": 166, "format": [1, 4, 5, 9, 14, 156, 158, 159, 160, 161, 169], "formerli": 156, "forward": [13, 19, 127, 137, 138, 139, 140, 141, 146, 147, 155, 156, 177, 178], "forward_reward": [137, 138, 139, 140, 146, 147, 169], "forward_reward_weight": [137, 138, 139, 140, 146, 147, 169], "found": [20, 136, 142, 148, 155, 156, 174, 177], "foundat": [148, 156, 165, 171], "four": [128, 129, 137, 139, 148, 154, 156, 158, 159, 174], "foxik": 155, "fp": [2, 9, 10, 17, 129, 156, 165], "frac": [137, 138, 139, 140, 141, 146, 147], "frame": [2, 9, 10, 17, 18, 20, 128, 129, 144, 145, 155, 156, 161, 175], "frame_skip": [17, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 169], "framer": 165, "frameskip": 17, "frameskipobserv": 156, "framestack": [17, 18, 155, 156], "framestackobserv": [17, 18, 20, 156], "frametim": [137, 138, 139, 140, 141, 146, 147], "framework": [14, 17, 20, 136, 148, 156, 169], "franuka": 153, "free": [131, 135, 136, 137, 140, 141, 142, 143, 148, 169, 174, 177], "free_body_rot": 146, "freedom": [140, 141, 142, 167], "freejoint": [140, 141], "freez": [14, 18, 19], "frequenc": 17, "frequent": [155, 166], "friction": [127, 146, 147, 148], "frictionless": 132, "from": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 127, 128, 129, 131, 136, 137, 138, 139, 140, 141, 142, 144, 145, 146, 147, 148, 150, 151, 152, 153, 154, 155, 156, 158, 159, 160, 161, 162, 163, 166, 169, 173, 174, 175, 177, 178], "from_json": [5, 156], "front": [137, 138, 146, 147], "front_left_leg": 137, "front_right_leg": 137, "frontpag": 156, "frozen": [149, 155, 156, 175], "frozen_lak": [153, 175], "frozenlak": [9, 153, 155, 156, 170, 171, 176], "frozenlake4x4": 156, "frozenlake8x8": [153, 155, 156], "frozenlake_q_learn": 175, "frozenset": 7, "fshin": 138, "fthigh": 138, "fuel": 129, "full": [3, 4, 128, 129, 155, 156, 158, 159, 174], "fulli": [2, 129, 137, 138, 139, 140, 141, 143, 146, 147, 148, 155], "fun": [174, 177], "func": [3, 14, 16, 18, 19, 156], "func_env": 3, "funcenv": [3, 156], "funcjaxenv": 156, "function": [2, 8, 10, 11, 12, 14, 16, 17, 18, 19, 20, 129, 132, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 153, 154, 155, 156, 158, 163, 166, 167, 169, 171, 174, 175, 177, 178], "functional_jax_env": 3, "functionaljaxenv": 3, "fundament": [159, 161, 163, 164, 168, 170], "furcolor": 9, "further": [2, 5, 7, 129, 144, 145, 155, 156, 175, 177], "furthermor": [2, 9, 156, 158], "furthest": 127, "futur": [3, 155, 156, 160, 163, 173], "future_q_valu": [163, 174], "g": [1, 2, 4, 5, 7, 8, 9, 11, 12, 13, 20, 131, 135, 137, 138, 139, 140, 141, 143, 146, 147, 148, 153, 154, 155, 156, 165, 167, 174, 175, 177, 178], "ga": 128, "gae": 178, "gaetanlepag": 156, "gain": [156, 167], "galleri": [1, 156], "game": [7, 9, 17, 126, 150, 151, 152, 153, 155, 156, 158, 159, 160, 163, 165, 174], "gamma": [14, 19, 160, 166, 175, 177, 178], "gap": 148, "garbag": [10, 11, 12, 17, 156], "gather": 165, "gaussian": 136, "gc_trigger": 17, "gcc": 148, "gen_gif": 1, "gen_md": 1, "gener": [1, 2, 3, 4, 5, 6, 7, 9, 10, 11, 12, 13, 15, 17, 127, 128, 129, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 150, 151, 152, 153, 154, 155, 156, 157, 159, 161, 162, 173, 178], "generalis": [2, 10], "generate_random_map": [153, 175], "geometr": [6, 136], "geometri": 156, "get": [2, 4, 11, 12, 14, 15, 18, 19, 127, 129, 136, 137, 139, 140, 142, 150, 155, 156, 158, 159, 161, 165, 166, 169, 173, 174, 175, 178], "get_act": [163, 174], "get_attr": [11, 12, 156], "get_env_id": 4, "get_loss": 178, "get_moving_avg": 163, "get_rect": 165, "get_stat": 155, "get_wrapper_attr": [15, 156], "gianluca": 156, "gianlucadecola": [155, 156], "giant": 163, "gif": [1, 131, 156], "git": [165, 169], "github": [19, 129, 132, 136, 137, 139, 140, 141, 142, 143, 144, 145, 147, 151, 152, 155, 156, 160, 165, 169, 171], "give": [2, 10, 129, 137, 150, 154, 155, 158, 159, 174, 177, 178], "given": [3, 4, 5, 7, 16, 127, 129, 130, 131, 132, 133, 134, 137, 139, 140, 142, 143, 147, 155, 156, 166, 174], "glfw": 136, "global": 4, "gnn": 148, "go": [2, 9, 128, 148, 150, 155, 159, 162, 163, 166, 169, 174, 177, 178], "go1": 169, "goal": [2, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 150, 151, 152, 153, 154, 159, 160, 163, 165, 177], "goal_slidei": 144, "goal_slidex": 144, "goal_veloc": [133, 134], "godsboy404": 156, "goe": [150, 155, 163], "gone": 155, "good": [158, 159, 163, 174, 175, 178], "googl": [155, 169], "goul\u00e3o": 156, "gp": 148, "gpu": [136, 148, 156, 162, 178], "gracefulli": 155, "gradient": [177, 178], "gradual": [158, 161, 163], "grai": 17, "grammat": 156, "grant": 129, "graph": [5, 6, 8, 13, 148, 155, 156, 158, 174, 178], "graphic": [136, 155], "graphinst": [6, 8, 13, 155, 156], "grasp": 148, "grave": 178, "gravit": 129, "graviti": [129, 132, 133, 135, 142, 143, 148, 177, 178], "grayscal": [14, 17, 18, 20], "grayscale_env": 18, "grayscale_newaxi": 17, "grayscale_ob": 17, "grayscaleobserv": [14, 18, 20], "great": [148, 167, 174], "greater": [129, 131, 132, 133, 134, 143, 150, 174], "greedi": [163, 173, 174, 175], "greedili": 174, "green": [131, 154], "grei": 174, "greyscal": 17, "grid": [148, 151, 152, 153, 154, 159, 161, 165, 173, 174], "grid_world": 165, "gridlin": 165, "gridworld": [2, 148, 151, 152, 158, 165], "gridworldenv": [159, 165], "griesbach": 156, "grip": 174, "ground": [127, 129, 141, 148], "group": [129, 155], "grow": 161, "gt": [155, 156], "guarante": [5, 6, 13, 17, 148, 171], "guess": 155, "guid": [148, 156, 157, 159, 169], "guidelin": 17, "guyazran": 156, "gym": [2, 5, 8, 9, 10, 11, 12, 14, 15, 16, 17, 18, 19, 126, 127, 128, 129, 131, 132, 133, 134, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 150, 151, 152, 153, 154, 156, 157, 158, 159, 161, 163, 165, 166, 167, 169, 173, 174, 175, 177, 178], "gym4real": 148, "gymfc": 148, "gymlibrari": 155, "gymnasium": [2, 3, 4, 5, 6, 7, 8, 9, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 126, 127, 128, 129, 130, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 150, 151, 152, 153, 154, 157, 159, 160, 161, 162, 163, 166, 169, 172, 173, 174, 175, 176, 177, 178], "gymnasium_env": [159, 165], "gymnasium_robot": [136, 156, 160], "gymnax": 148, "gymv21compat": 156, "gymv21environ": 160, "gymv22compat": 156, "gymv22environ": 156, "gymv26environ": 160, "gyroscop": 128, "h": 153, "h5": 178, "ha": [1, 2, 4, 5, 7, 8, 9, 10, 13, 14, 15, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 127, 128, 129, 130, 131, 132, 133, 134, 135, 136, 137, 139, 140, 141, 144, 145, 146, 148, 150, 154, 155, 156, 157, 158, 159, 163, 165, 166, 169, 173, 174, 175, 177, 178], "hacki": 13, "had": [2, 155, 156], "half": 136, "half_cheetah": 138, "halfcheetah": [14, 136, 138], "halt": 166, "hand": [148, 150, 163, 177], "handl": [5, 10, 11, 12, 142, 150, 155, 156, 158, 160, 163, 168, 170, 174], "handling_time_limit": 166, "hang": [13, 131, 155], "hannah": 156, "happen": [133, 134, 137, 139, 140, 142, 143, 147, 150, 153, 154, 155, 156, 158, 159, 163, 166], "haracterist": 177, "hard": [156, 159, 160, 175], "hardcor": 127, "harden": [155, 156], "harder": [129, 169], "hardwar": [148, 155, 156], "harlei": 178, "harm": 174, "hasattr": 156, "hash_se": 155, "hasselmo": 131, "hatchl": 165, "have": [2, 4, 5, 7, 8, 10, 11, 13, 14, 15, 16, 17, 18, 126, 127, 128, 131, 137, 140, 141, 142, 143, 144, 145, 147, 150, 153, 154, 155, 156, 158, 159, 160, 163, 165, 166, 167, 169, 174, 175, 177, 178], "haven": 17, "head": [11, 138, 160], "headless": [136, 155], "healthi": [137, 139, 140, 142, 143, 147], "healthy_angle_rang": [139, 147], "healthy_reward": [137, 139, 140, 142, 143, 147, 169], "healthy_state_rang": 139, "healthy_z_rang": [137, 139, 140, 147, 169], "heart": [158, 163], "heatmap": [174, 175], "height": [131, 136, 137, 139, 140, 142, 147, 155, 156, 169], "held": 150, "hello": 7, "help": [2, 4, 5, 9, 155, 156, 158, 161, 164, 168, 170, 173, 174, 178], "helper": [155, 159], "helpingstar": 156, "henc": [137, 149, 177], "here": [3, 9, 131, 137, 140, 155, 156, 159, 161, 163, 165, 169, 178], "heurist": [127, 129, 148, 156], "hffg": 153, "hidden": [2, 177], "hidden_space1": 177, "hidden_space2": 177, "hierarch": [5, 154], "high": [2, 6, 7, 8, 11, 12, 13, 14, 18, 131, 132, 134, 135, 137, 148, 155, 156, 158, 163, 167, 169, 178], "higher": [19, 127, 144, 163, 169, 173, 178], "highest": [4, 163], "highli": [5, 9, 126, 130, 148, 155, 165], "highwayenv": [148, 156], "hill": [133, 134], "hing": [137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147], "hinge2": 142, "hint": [155, 156], "hinter": 155, "hip": [127, 137, 140, 141], "hip_1": 137, "hip_2": 137, "hip_3": 137, "hip_4": 137, "histor": [148, 159], "histori": 136, "histplot": 175, "hit": [150, 158, 159, 163, 174], "hold": [5, 150, 174], "hole": [153, 175], "homepag": 156, "hood": 156, "hook": [155, 156], "hooper": 156, "hop": [136, 139, 147], "hope": 156, "hopefulli": [155, 174], "hopper": [15, 16, 136, 147, 156], "hopper_v4": 15, "hopperenv": 15, "horizon": [9, 139, 148, 166], "horizon_timestep": 9, "horizont": [127, 129, 131, 159, 165], "host": 156, "hot": 8, "hotter": 155, "hour": 161, "hous": 163, "how": [2, 5, 6, 9, 11, 12, 14, 141, 142, 144, 145, 148, 156, 158, 159, 160, 161, 163, 165, 166, 167, 171, 174, 178], "howardh": 156, "howev": [2, 5, 6, 7, 8, 9, 10, 11, 13, 16, 17, 131, 137, 138, 139, 140, 141, 145, 146, 147, 155, 156, 158, 165, 166, 167, 174, 178], "hpo": 171, "html": [18, 177], "http": [1, 2, 10, 11, 12, 18, 19, 128, 131, 150, 151, 152, 153, 155, 156, 165, 169, 174, 175, 177, 178], "hue": 175, "huge": [148, 155], "hull": 127, "human": [2, 6, 9, 17, 20, 128, 136, 140, 141, 144, 148, 155, 156, 157, 158, 159, 160, 165, 169, 178], "humanoid": [136, 156, 169, 171], "humanoidstandup": [136, 141], "humanoidstandup_v4": 155, "humanrend": [17, 20, 156], "humnaoid": 169, "hundr": 161, "hundredth": 17, "hyperparam": 178, "hyperparamet": [161, 163, 171, 173, 174, 175, 177, 178], "i": [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 126, 127, 128, 129, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 150, 151, 152, 153, 154, 155, 156, 157, 159, 160, 161, 162, 163, 164, 165, 166, 167, 168, 169, 170, 172, 173, 174, 175, 176, 177, 178], "i_": [137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147], "ianyfan": 156, "ic": 153, "ice1187": 155, "iclr": 178, "icml": 178, "icu": 148, "id": [4, 17, 136, 137, 140, 141, 153, 156, 159, 165], "idea": [158, 166, 174], "ident": [7, 11, 12, 136, 156], "identifi": [155, 161], "idx": 175, "if__name__": 178, "iff": [9, 17, 165], "iforce2d": 128, "igibson": 148, "ignor": [1, 9, 150, 155, 160, 163, 174], "ikamensh": [155, 156], "illeg": 154, "illustr": [14, 165, 166], "im": 143, "imag": [2, 5, 10, 11, 12, 14, 17, 18, 20, 128, 136, 156, 158, 169], "imagesequenceclip": 9, "imagin": [148, 158, 167], "img": 173, "immedi": [9, 19, 20, 137, 139, 140, 141, 147, 150, 158, 159, 163, 165], "immut": 5, "impact": [141, 160, 175], "impact_cost": 141, "impact_cost_rang": 141, "impact_cost_weight": 141, "implement": [5, 6, 9, 10, 15, 16, 17, 20, 129, 132, 135, 142, 148, 149, 155, 156, 158, 159, 160, 161, 163, 164, 165, 168, 170, 171, 172, 173, 176, 177, 178], "implementing_custom_wrapp": 167, "implic": 160, "implicitli": 178, "import": [2, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 127, 128, 129, 131, 132, 133, 134, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 150, 151, 152, 153, 154, 155, 156, 157, 158, 159, 160, 161, 163, 165, 167, 169, 173, 175, 177, 178], "importantli": [15, 156, 158], "importerror": 156, "imposs": [159, 163, 173], "improv": [11, 155, 156, 158, 160, 161, 162, 173], "imshow": 175, "inaccur": 163, "includ": [2, 4, 14, 17, 18, 20, 132, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 154, 155, 156, 158, 159, 161, 165, 166, 169, 171], "include_cfrc_ext_in_observ": [137, 140, 141, 169], "include_cinert_in_observ": [140, 141], "include_cvel_in_observ": [140, 141], "include_qfrc_actuator_in_observ": [140, 141], "inclus": [137, 155], "incompleteidea": [150, 151, 152], "inconsist": 160, "incorpor": 148, "incorrect": [154, 155, 156, 159, 166], "incorrectli": [19, 156], "increas": [129, 131, 132, 136, 139, 144, 146, 147, 156, 162, 163, 174, 175, 178], "incur": [131, 151, 152, 154], "independ": [6, 7, 10, 129, 139, 146, 147, 156, 173], "index": [1, 6, 9, 13, 14, 17, 18, 20, 132], "indic": [2, 9, 14, 17, 128, 131, 132, 150, 151, 152, 153, 154, 155, 163, 166, 173, 174, 175, 177], "individu": [2, 11, 12, 137, 138, 139, 140, 141, 142, 144, 145, 146, 147, 155, 159, 165, 167, 173, 177], "indoril007": 155, "induc": [137, 138, 139, 140, 141, 146, 147], "induct": [137, 138, 139, 140, 141, 146, 147], "ineffici": [156, 162], "inelast": [133, 134], "inertia": [140, 141], "inf": [2, 10, 16, 18, 132, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 156, 158, 167, 169], "infam": 174, "infeas": 7, "infer": [7, 155], "infinit": [16, 17, 18, 129, 139, 150, 155, 156, 158, 159, 163, 166, 174], "info": [2, 3, 9, 10, 11, 12, 14, 17, 18, 19, 20, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 154, 155, 156, 157, 158, 159, 160, 161, 163, 165, 166, 167, 169, 173, 174, 175, 177, 178], "inform": [1, 2, 5, 6, 7, 9, 10, 11, 12, 18, 20, 127, 128, 129, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 155, 156, 158, 159, 160, 163, 165, 166, 169, 174, 177], "infti": [7, 139], "inher": 166, "inherit": [4, 5, 15, 16, 18, 19, 155, 156, 159, 165], "init": [128, 159, 161, 165, 178], "initi": [2, 3, 4, 6, 7, 9, 10, 14, 15, 16, 17, 18, 19, 127, 129, 130, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 150, 151, 152, 153, 154, 155, 159, 161, 163, 167, 169, 173, 174, 175, 177, 178], "initial_epsilon": [163, 174], "initial_sampl": 156, "initialis": [2, 4, 10, 17, 150, 156, 157], "inlin": 178, "inner": 11, "inner_st": 6, "inplac": 177, "input": [9, 10, 156, 158, 159, 174, 178], "inregular": 17, "insert": [157, 177], "insid": [1, 6, 7, 17, 148, 154, 159, 165], "insight": [148, 158, 163], "inspect": 9, "inspir": [151, 152, 156, 175], "instabl": [162, 163], "instal": [1, 9, 17, 126, 130, 136, 155, 156, 158, 160, 165, 169], "instanc": [2, 3, 4, 5, 6, 8, 9, 10, 11, 13, 17, 18, 156, 158, 159, 162, 167, 178], "instanti": [9, 14, 17, 18, 19, 165, 175], "instead": [2, 10, 11, 14, 15, 127, 131, 137, 140, 147, 155, 156, 158, 159, 160, 161, 163, 165, 178], "institut": [133, 134], "instruct": [136, 148, 156, 165], "insuffici": 163, "int": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 136, 137, 150, 151, 152, 153, 154, 156, 159, 163, 165, 173, 174, 175, 177, 178], "int23": 17, "int32": [6, 8, 10, 14, 18, 159], "int64": [6, 7, 8, 156, 159], "int8": [5, 7], "int_32": 17, "integ": [2, 6, 7, 8, 9, 14, 16, 17, 18, 155, 156, 159, 165], "integr": [9, 156, 169], "intellig": [154, 155, 158, 163], "intend": [3, 14, 17, 148, 151, 152, 153, 154, 171, 175], "intens": 148, "interact": [5, 9, 14, 17, 20, 148, 158, 159, 163, 165, 174, 178], "interest": [18, 156, 161, 169], "interestingli": 175, "interfac": [9, 156, 157, 158], "interlink": 158, "intermedi": [140, 141, 159], "intermitt": 17, "intern": [2, 3, 10, 155, 156, 159, 160, 161], "internet": 148, "interoper": 148, "interv": [7, 137, 139, 140, 147, 161], "intrins": 167, "introduc": [137, 140, 141, 148, 155, 156, 160], "introduct": [131, 150, 151, 152, 175], "introductori": 156, "invalid": [2, 7, 156, 159, 169, 173, 174], "invers": 4, "invert": [135, 136, 177], "inverted_double_pendulum": 142, "inverted_pendulum": [143, 177], "inverteddoublependulum": [136, 142], "invertedpendulum": [136, 143, 177], "investig": 156, "involv": [6, 126, 142, 148, 151, 152, 153, 154, 155, 156, 165, 177], "io": [18, 148, 153], "ipynb": [165, 166, 167, 169, 173, 174, 175, 177, 178], "irrelev": 159, "irrespect": 9, "is_avail": 178, "is_bound": 7, "is_np_flatten": [5, 156], "is_rain": 154, "is_raini": 154, "is_slipperi": [151, 152, 153, 156, 175], "is_slippi": 156, "is_vector_env": 9, "isaac": 148, "isinst": 156, "isn": [6, 9, 156, 159, 161], "isort": 156, "issu": [17, 18, 129, 132, 136, 137, 139, 140, 141, 142, 143, 144, 145, 147, 155, 156, 160, 161, 165], "itch": 153, "item": [9, 13, 18, 174, 175, 178], "iter": [5, 6, 12, 13, 156, 159], "itomori": 148, "its": [2, 9, 16, 17, 129, 135, 136, 137, 139, 141, 144, 147, 148, 156, 158, 160, 175, 177, 178], "itself": [3, 8, 10, 11, 12, 15, 17, 155, 156, 158, 159, 160, 178], "j": [156, 177, 178], "jack": 150, "jair": 154, "jamartinh": 156, "jax": [2, 14, 17, 20, 148, 156, 162], "jax_to_numpi": 156, "jaxenv": [14, 17], "jaxtonumpi": [14, 17, 20, 156], "jaxtotorch": [14, 17, 20, 156], "jessefarebro": 155, "jet": 156, "jfpettit": 155, "jimini": 148, "jin": 156, "jit": 162, "jjshoot": [155, 156], "jkterry1": 155, "jnp": 17, "job": [148, 165], "job_statu": 6, "john": 156, "johnminelli": 155, "johnnycode8": 171, "join": [5, 156], "joint": [127, 129, 131, 132, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147], "joint0": 145, "joint1": 145, "jordan": [137, 156, 178], "journal": 154, "journei": [155, 174], "json": 156, "json_env_spec": 156, "jsonabl": 5, "jump": 169, "jumpi": 156, "jun": 156, "junk": 14, "jupyt": [1, 155, 165, 166, 167, 169, 170, 173, 174, 175, 177, 178], "just": [3, 13, 15, 143, 145, 155, 156, 158, 159, 160, 162, 163, 165, 169, 178], "k": [8, 9, 14, 129, 146, 156, 178], "kad99kev": 156, "kalli": 169, "kallinteri": [156, 169], "karp": 178, "kavukcuoglu": 178, "kde": 175, "keep": [9, 14, 17, 18, 20, 132, 141, 143, 159, 163, 165], "keep_dim": [14, 18], "kei": [2, 4, 5, 6, 7, 9, 10, 14, 17, 18, 20, 137, 138, 139, 140, 141, 146, 147, 151, 152, 153, 154, 155, 156, 158, 163, 165, 166, 167, 173, 174, 175], "kellycoinflip": 155, "kept": [10, 136, 169], "kerajli": 156, "kexianshen": 155, "key_to_act": 9, "keyb0ardninja": 156, "keyboard": [7, 9, 155], "keys_to_act": [9, 155, 178], "keyword": [4, 6, 10, 11, 12, 14, 131, 132, 150, 155, 156, 158, 165, 174], "kg": [155, 156], "khoda81": 156, "kind": 7, "king": 150, "kir0ul": [155, 156], "klimov": [126, 127, 128, 129], "knee": [127, 140, 141], "know": [2, 156, 158, 159, 160, 162, 163, 165], "knowledg": [4, 163], "known": [2, 163], "krimmel": 156, "kvrban": 156, "kwarg": [3, 4, 9, 10, 11, 12, 14, 15, 137, 138, 139, 140, 146, 147, 156, 165], "kwiatkowski": 156, "l": [14, 17, 146, 156, 161], "l2r": 148, "lab_black": 175, "label": [161, 173, 174, 175], "laboratori": 148, "lack": 156, "ladder": 127, "lai": 141, "lake": [149, 155, 156], "lam": 178, "lambaactionv0": 156, "lambda": [11, 12, 14, 16, 17, 18, 19, 156, 161, 163, 174, 178], "lambdaact": 14, "land": 129, "lander": [126, 155, 156], "lane": 148, "lap": [128, 155], "lap_complete_perc": 128, "larg": [11, 129, 134, 137, 138, 139, 140, 141, 144, 145, 146, 147, 148, 155, 156, 162, 163, 167, 169, 175], "larger": [163, 178], "largest": 155, "last": [9, 13, 14, 17, 18, 20, 141, 144, 145, 155, 156, 161, 165, 166, 175], "latent": 148, "later": [129, 158, 159, 161, 163, 174, 177, 178], "latest": [2, 162, 177], "latin": 7, "latter": [151, 152], "lava": 2, "layer": [3, 15, 158, 159, 177], "lazili": 5, "lazyfram": 18, "lead": [160, 178], "learn": [2, 5, 6, 17, 18, 19, 127, 128, 129, 131, 132, 133, 134, 138, 142, 143, 146, 148, 149, 150, 151, 152, 154, 155, 156, 157, 161, 162, 165, 169, 170, 171, 173, 176, 178], "learner": 175, "learning_r": [163, 173, 174, 175, 177], "learnt": 4, "least": [7, 129, 136], "leav": [132, 142, 165, 175], "left": [7, 127, 128, 129, 132, 133, 137, 140, 141, 142, 143, 147, 151, 152, 153, 154, 158, 159, 165, 169, 173, 174, 175, 177], "left_elbow": [140, 141], "left_elfbow": [140, 141], "left_foot": [140, 141], "left_hip_i": [140, 141], "left_hip_x": [140, 141], "left_hip_z": [140, 141], "left_hiz_z": [140, 141], "left_kne": [140, 141], "left_lower_arm": [140, 141], "left_shoulder1": [140, 141], "left_shoulder2": [140, 141], "left_sin": [140, 141], "left_thigh": [140, 141], "left_upper_arm": [140, 141], "leg": [127, 129, 137, 139, 140, 141, 147], "leg_joint": [139, 147], "leg_left_joint": 147, "legaci": 155, "legend": [161, 173, 174, 175], "legend_el": 174, "len": [6, 17, 161, 163, 167, 173, 174, 178], "length": [4, 6, 7, 9, 11, 12, 14, 17, 20, 127, 131, 132, 133, 134, 146, 148, 153, 154, 155, 156, 158, 161, 163, 174, 178], "length_mask": 6, "length_moving_averag": [163, 174], "length_queu": [14, 17, 161, 163, 174], "leq": 142, "less": [127, 129, 146, 147, 158, 163, 175], "lesson": 175, "let": [148, 156, 158, 159, 163, 165, 167, 173, 174, 175, 177], "letter": [153, 154, 155], "level": [9, 15, 158, 161, 169], "levin": [137, 178], "lg": 156, "li": [141, 156], "lib": [151, 152], "librari": [148, 156, 157, 165, 169], "licens": [155, 156, 165, 174, 175, 177, 178], "lidar": 127, "life": [17, 155, 156, 177], "lift": 144, "light": 148, "lighter": 156, "lightgreen": 174, "lightli": 160, "lightweight": [148, 161], "ligibl": 177, "like": [3, 5, 7, 9, 13, 14, 15, 16, 17, 18, 19, 20, 138, 143, 147, 148, 154, 155, 156, 158, 159, 161, 163, 165, 167, 169, 171, 178], "lillicrap": 178, "limit": [17, 20, 132, 143, 155, 156, 158, 159, 160, 162, 163, 168, 170, 174, 177, 178], "lin826": 155, "linalg": [9, 159, 165], "line": [2, 5, 131, 155, 156, 159, 165], "linear": [10, 129, 131, 142, 143, 146, 177, 178], "linearli": [14, 16, 18, 20, 131, 142, 143, 177], "linecolor": 175, "lineplot": [175, 177], "linewidth": [161, 173, 174, 175], "link": [21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 131, 137, 145, 146, 156, 165], "linux": 156, "list": [2, 4, 5, 6, 7, 9, 10, 11, 12, 14, 15, 17, 18, 155, 156, 158, 159, 161, 174, 175, 178], "list_info": 14, "listdir": 17, "liter": 156, "littl": [129, 156, 159, 163], "live": [1, 9, 159, 174], "ll": [155, 158, 159, 161, 163, 173, 174, 178], "llvm": 148, "load": [4, 155, 156, 168, 170], "load_env_cr": 4, "load_ext": 175, "load_quadruped_model": 169, "load_state_dict": 178, "load_weight": 178, "loc": [154, 178], "local": 165, "localhost": 1, "locat": [4, 136, 148, 151, 152, 153, 154, 159, 165, 173], "log": [2, 9, 14, 16, 17, 18, 19, 161, 175, 177, 178], "log_prob": [177, 178], "logan": 156, "logger": [17, 155], "logic": [11, 128, 155, 156, 159, 163, 165, 169], "logical_or": 156, "logit": 178, "long": [7, 9, 17, 132, 143, 148, 155, 156, 159, 161, 163], "longer": [2, 136, 137, 139, 143, 147, 155, 156, 160, 177], "look": [5, 9, 17, 158, 160, 161, 165, 166, 167, 175, 178], "loop": [148, 160, 174, 178], "lose": [129, 150, 163, 174], "loss": [17, 150, 163, 177, 178], "lost": 17, "lot": [15, 163, 167, 174, 177], "low": [2, 6, 7, 8, 12, 13, 14, 18, 131, 132, 134, 135, 155, 156, 163, 167, 173, 178], "lower": [7, 14, 15, 19, 20, 140, 141, 155, 158, 163, 174, 178], "lower_waist": [140, 141], "lpizzinidev": 156, "lr": [163, 174, 175, 177, 178], "lt": [155, 156], "lucasalegr": 156, "lunar": [126, 155, 156], "lunar_land": [129, 156], "lunarland": [17, 129, 155, 156, 157, 160, 163, 178], "lunarlandercontinu": 167, "lwaist": [140, 141], "lz4": 18, "m": [8, 131, 133, 134, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 155, 169, 178], "mab": 148, "machado": [16, 17], "machin": [155, 175, 177], "made": [1, 129, 137, 138, 139, 140, 141, 143, 146, 147, 155, 156, 160, 169, 171, 178], "magnitud": [9, 129, 134, 142, 143, 177], "mahiuchun": 155, "mai": [2, 5, 7, 8, 9, 11, 14, 15, 16, 18, 19, 151, 152, 153, 158, 160, 165, 169, 178], "main": [2, 129, 139, 147, 156, 160, 169, 175], "main_bodi": [137, 169], "mainli": [137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147], "maintain": [136, 148, 155, 156, 157, 160, 171, 173], "mainten": 155, "major": [155, 156], "make": [1, 2, 6, 9, 11, 12, 15, 16, 17, 18, 19, 127, 128, 129, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 150, 151, 152, 153, 154, 155, 156, 157, 158, 160, 161, 163, 167, 168, 169, 170, 173, 174, 175, 177, 178], "make_dict": 14, "make_vec": [2, 4, 9, 10, 11, 12, 14, 132, 156, 159, 162, 178], "malici": 156, "manag": [4, 13, 148, 163], "mandatori": [159, 165], "manhattan": [159, 165], "mani": [7, 14, 17, 136, 148, 155, 156, 159, 160, 163, 165, 174, 175], "manipul": 148, "manner": [3, 7, 18, 20, 155], "mantasu": 156, "manual": [9, 14, 158, 178], "manual_se": 177, "manuel": 156, "manufactur": 169, "map": [9, 14, 17, 153, 154, 156, 158, 159, 163, 165, 174, 177], "map_nam": 153, "map_siz": 175, "mar": [148, 156], "mariojerez": 156, "marionj": 156, "mark": 156, "markdown": 1, "market": 148, "markov": [148, 156, 158, 166], "markovian": 148, "marku": 156, "markus28": [155, 156], "marsexplor": 148, "mask": [5, 6, 7, 148, 154, 155, 156, 170, 176, 178], "masked_mean_curv": 173, "masked_mean_reward": 173, "masked_overall_mean": 173, "masked_overall_std": 173, "masked_result": 173, "masked_results_list": 173, "mass": [129, 137, 140, 141, 146], "massiv": 155, "master": [18, 151, 152, 155, 158, 177], "match": [4, 8, 11, 12, 16, 132, 156], "math": [135, 148, 155, 163], "mathbb": 7, "mathcal": [137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147], "mathemat": [5, 158, 177], "matplotlib": [9, 161, 163, 173, 174, 175, 177, 178], "matpoliquin": 156, "matric": [5, 148], "matrix": [6, 140, 141, 148], "matter": [7, 155, 159, 160], "matyasch": 156, "max": [4, 7, 14, 16, 17, 18, 20, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 153, 156, 163, 173, 174, 175, 177, 178], "max_a": 166, "max_act": [14, 15, 16, 20], "max_episode_step": [4, 17, 156, 159, 165, 169, 178], "max_geom": 136, "max_id": 175, "max_length": 7, "max_ob": [14, 18, 20], "max_reward": [10, 14, 19, 156, 167], "max_time_step": [132, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147], "maxandskipenv": 18, "maxandskipobserv": [18, 20, 156], "maxim": [159, 163, 177, 178], "maximis": 162, "maximum": [4, 7, 9, 14, 17, 18, 20, 129, 131, 135, 142, 156, 158, 163, 165, 173, 175, 178], "maxq": 154, "mayb": [2, 175], "maze": 159, "mclean": 156, "md": [1, 155, 156, 165], "mdp": [2, 17, 133, 134, 148, 158], "mean": [2, 14, 18, 19, 20, 131, 139, 144, 155, 156, 163, 165, 173, 175, 177, 178], "mean_reward": 173, "meaning": 163, "meant": 3, "meantim": 156, "measur": [9, 127, 135, 141, 142, 144, 145, 155, 159], "mechan": 156, "medium": 148, "mel": 153, "melbourn": 175, "melt": 177, "member": 5, "memori": [5, 17, 133, 134, 155, 156, 161, 162], "menageri": 169, "mention": [156, 177], "menu": 158, "mere": 165, "merg": 156, "meshcat": 148, "meshgrid": 174, "messag": [5, 155, 156, 161], "meta": [148, 155], "metaclass": 155, "metadata": [2, 3, 9, 10, 15, 17, 155, 156, 165, 167], "metatrad": 148, "metaworld": 148, "meter": [135, 148], "meth": [7, 17], "method": [3, 4, 6, 9, 14, 16, 17, 18, 19, 148, 155, 156, 159, 160, 163, 165, 167, 177, 178], "methodologi": 148, "metric": [2, 9, 156, 161, 178], "mgoulao": 156, "micim": 155, "microgrid": 148, "mid": 160, "middl": [139, 147, 163], "might": [2, 5, 7, 8, 15, 16, 158, 159, 162, 165, 167, 174, 177, 178], "migrat": [136, 156, 157], "mihaic": 156, "mileston": 161, "miller": 175, "min": [7, 14, 16, 131, 132, 133, 134, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147], "min_act": [14, 15, 16, 20], "min_length": 7, "min_ob": [14, 18, 20], "min_reward": [10, 14, 19, 156, 167], "minari": 148, "minatari": 148, "mind": 156, "mine": 148, "minecraft": 148, "minesweep": 148, "minetest": 148, "miniatur": 148, "minibatch": 178, "minigrid": [148, 156], "minim": [2, 148, 156, 159, 165, 166, 175, 178], "minimalist": 148, "minimum": [7, 14, 18, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 158, 159, 163, 175], "miniwob": 148, "miniworld": 148, "minor": [155, 156], "mirza": 178, "misc": [155, 156], "mischapanch": 156, "miss": [131, 154, 155, 156, 158, 159, 161], "mission": 5, "mistak": [156, 158, 159], "mit": [131, 174, 175, 177, 178], "mitig": 178, "mixtur": 156, "mj_camera": [137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147], "mj_step": [137, 140], "mjcf": 169, "mjdata": 136, "mjtvisflag": 136, "mjvcamera": 136, "mjvis_contactforc": 136, "mjvis_contactpoint": 136, "mjvisual": 136, "mkdir": [173, 178], "ml": [148, 155], "mmcaulif": 156, "mnih": 178, "mo": 148, "moba": 148, "mobil": 148, "modal": 136, "mode": [2, 4, 10, 11, 12, 14, 155, 156, 158, 161, 163, 165, 174, 178], "model": [137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 156, 159, 160, 171, 174], "modern": [148, 160], "modif": 167, "modifi": [2, 4, 5, 10, 14, 15, 16, 18, 19, 20, 131, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 154, 155, 156, 159, 165, 167], "modul": [4, 5, 13, 155, 156, 165, 167, 177, 178], "modular": [14, 15, 148, 158, 165, 167], "module_nam": 156, "moduletyp": [14, 17], "mojoco": 171, "moment": 3, "monitor": [17, 155, 156, 161], "monop": 136, "mont": [163, 174, 177, 178], "month": 156, "moon": 129, "moor": [133, 134], "moore90efficientmemori": [133, 134], "more": [1, 2, 5, 6, 7, 10, 11, 12, 14, 15, 16, 19, 20, 127, 129, 136, 137, 140, 141, 142, 143, 144, 145, 146, 147, 148, 155, 156, 158, 159, 160, 162, 163, 165, 166, 167, 169, 173, 174, 175, 177, 178], "moreov": [5, 14, 15, 17, 165, 167], "moritz": [137, 178], "most": [2, 5, 7, 13, 14, 15, 17, 18, 136, 145, 148, 155, 156, 158, 160, 162, 163, 165, 167, 169, 170, 172, 174, 176], "mostli": [155, 163], "motion": 148, "motor": [127, 146, 148, 155, 169], "motor1_rot": 146, "motor2_rot": 146, "mountain": [130, 155, 158], "mountaincar": [14, 133, 163, 171], "mountaincarcontinu": [14, 16, 19, 134], "mountaincarenv": 133, "move": [2, 14, 17, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 127, 129, 132, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 151, 152, 153, 154, 155, 156, 158, 159, 160, 161, 163, 165, 166, 169, 173, 175, 177], "movement": [154, 159, 163, 165], "moviepi": [9, 17, 155, 156], "moving_avg": 161, "mozer": 131, "mp": 13, "mp4": 161, "mpi": 13, "mpi4pi": 13, "mpi_init": 13, "mt19937": 155, "mtsim": 148, "much": [155, 156, 159, 160, 163, 165, 166, 169], "mujoco": [1, 9, 15, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 155, 156, 158, 167, 169, 170, 176], "mujoco_env": [155, 156], "mujoco_gl": 136, "mujoco_menageri": 169, "mujoco_reinforc": 177, "mujoco_rend": 155, "mujocoenv": 156, "mujocorend": 156, "mujocorender": 156, "multi": [2, 7, 136, 140, 141, 144, 148, 159], "multiag": 148, "multibinari": [5, 6, 7, 8, 13, 18, 156, 158], "multidiscret": [5, 6, 7, 8, 10, 13, 18, 155, 156, 158, 165], "multimod": 148, "multipl": [5, 6, 7, 10, 11, 12, 13, 155, 156, 158, 159, 161, 162, 173, 178], "multipli": [6, 129, 134, 144, 145, 178], "multiprocess": [5, 11, 13, 178], "multivari": [137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147], "must": [2, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 128, 136, 139, 147, 155, 156, 159, 163, 165, 166], "mutual": 136, "my": 175, "my_packag": 159, "mypi": [2, 156], "n": [4, 5, 6, 7, 8, 11, 12, 13, 17, 18, 20, 128, 131, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 155, 156, 158, 161, 163, 173, 174, 175, 177, 178], "n_action": [173, 178], "n_env": 178, "n_episod": [163, 174], "n_featur": 178, "n_run": [173, 175], "n_showcase_episod": 178, "n_state": 173, "n_steps_per_upd": 178, "n_updat": 178, "na": 145, "name": [1, 3, 4, 11, 12, 15, 20, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 155, 156, 159, 161, 165], "name_prefix": [9, 17, 161], "namedtupl": [156, 175], "namespac": [4, 159, 165], "nanoquadrotor": 148, "narrow": 175, "nativ": 17, "natur": [148, 150, 153, 160, 163, 174], "naverag": 161, "navig": [148, 154, 159, 165, 167], "nbodi": [137, 140, 141], "nchain": 155, "ncol": [151, 152, 153, 163, 174, 175, 178], "ncrement": 177, "ndarrai": [2, 3, 6, 7, 8, 9, 13, 14, 16, 17, 18, 19, 131, 132, 133, 134, 135, 154, 177, 178], "neccari": 9, "necessari": [2, 5, 126, 155, 156, 173], "necessarili": 8, "need": [2, 5, 6, 9, 14, 15, 16, 18, 127, 129, 132, 136, 155, 156, 158, 159, 160, 161, 162, 163, 165, 166, 167, 169, 173, 174, 175, 178], "need_visu": 160, "neg": [2, 7, 9, 134, 137, 138, 139, 140, 141, 142, 144, 145, 146, 147, 154, 158, 159, 163, 177], "neither": [7, 17, 150, 154], "nerdyespresso": 156, "nervous": 127, "nest": [6, 13, 148], "net": [128, 150, 151, 152, 177, 178], "network": [5, 8, 10, 13, 146, 148, 158, 159, 163, 178], "neural": [5, 8, 10, 13, 131, 146, 148, 159, 163, 177, 178], "neurip": 131, "neuro": 148, "neuroflight": 148, "neuronlik": [132, 142, 143], "nevalu": 161, "never": [2, 138, 141, 144, 145, 146, 156, 173], "nevertheless": 167, "new": [2, 5, 14, 15, 16, 17, 18, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 131, 132, 133, 134, 135, 137, 138, 139, 140, 141, 146, 147, 154, 155, 156, 157, 158, 159, 162, 163, 165, 166, 167, 169, 174, 175, 178], "new_action_spac": 14, "new_obs_spac": 14, "new_po": 159, "new_q": 163, "new_spac": 14, "new_stat": 175, "new_throughput": 9, "newer": [136, 155], "newli": [14, 18, 19], "newlin": 2, "next": [2, 3, 10, 13, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 156, 157, 169, 173, 177], "next_mask": 173, "next_max": 173, "next_ob": [156, 160, 163, 174, 177], "next_stat": [3, 156, 163, 173, 174], "next_step": [11, 12], "next_valu": 160, "nice": 155, "nidhish": 156, "nine": 137, "nintendo": 7, "nip": 131, "nlp": 148, "nlpgym": 148, "nn": [177, 178], "no_grad": 178, "node": [5, 6, 8, 155, 158], "node_spac": [6, 8], "nois": [130, 136, 156], "noisi": [161, 163], "non": [2, 5, 8, 9, 14, 17, 129, 132, 137, 138, 139, 140, 141, 146, 147, 148, 153, 155, 156, 159, 165, 166, 177], "non_random_ob": 128, "nonbreak": 155, "nondeterminist": [4, 165], "none": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 136, 153, 155, 156, 158, 159, 160, 165, 173, 174, 175, 178], "nonlinear": 139, "nonzero": 173, "noop": [7, 9, 17, 154, 156, 178], "noop_max": [17, 156], "nor": [7, 17, 150, 151, 152, 154], "norm": [9, 144, 145, 159, 165], "normal": [2, 4, 7, 10, 13, 14, 17, 18, 19, 20, 127, 128, 135, 137, 138, 142, 155, 156, 162, 163, 177, 178], "normalis": 156, "normalize_tim": 18, "normalizeobserv": [14, 18, 20, 155, 156], "normalizereward": [14, 19, 20, 155], "normalizex": 156, "north": [154, 173], "notabl": [155, 156, 166], "note": [1, 5, 9, 13, 14, 17, 18, 131, 132, 136, 137, 139, 140, 141, 142, 144, 147, 154, 158, 160, 162, 166, 169, 174, 177, 178], "notebook": [1, 155, 165, 166, 167, 169, 170, 173, 174, 175, 177, 178], "noth": [3, 128, 129, 156, 159, 177], "notic": 156, "notif": 156, "notimplementederror": 8, "nov": 154, "now": [2, 127, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 155, 156, 158, 159, 163, 165, 166, 169, 173, 174, 175, 177], "np": [2, 5, 6, 7, 9, 10, 12, 13, 14, 16, 18, 19, 129, 133, 140, 141, 154, 155, 156, 159, 161, 163, 165, 167, 169, 173, 174, 175, 177, 178], "np_random": [2, 5, 9, 10, 11, 12, 15, 155, 156, 159, 165], "np_random_se": [2, 10, 11, 12, 15, 156], "nrow": [153, 175, 178], "nstep": 156, "num": [14, 17, 131, 132, 133, 134, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147], "num_col": 4, "num_edg": 6, "num_env": [4, 10, 11, 12, 13, 14, 132, 156, 159, 178], "num_episod": 163, "num_eval_episod": 161, "num_nod": 6, "num_training_episod": 161, "number": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 16, 17, 18, 20, 128, 129, 131, 136, 139, 140, 141, 146, 147, 148, 150, 153, 155, 156, 158, 159, 161, 162, 163, 165, 169, 175, 177, 178], "numer": [142, 143, 150, 155, 156, 161, 167, 177], "numpi": [2, 5, 7, 9, 10, 11, 12, 13, 14, 16, 17, 18, 19, 20, 155, 156, 159, 161, 163, 165, 167, 169, 173, 174, 175, 177, 178], "numpytotorch": [14, 17, 20, 156], "nv": [140, 141], "nvec": 7, "nvidia": 148, "o": [17, 161, 177, 178], "o_": 166, "o_t": 166, "ob": [9, 12, 14, 16, 17, 18, 128, 154, 155, 156, 158, 159, 160, 161, 163, 167, 169, 174, 177], "obj_slidei": 144, "obj_slidex": 144, "object": [2, 5, 9, 11, 12, 13, 14, 15, 136, 144, 145, 148, 156, 158, 161, 174, 177], "obs0": 18, "obs1": 18, "obs2": 18, "obs3": 18, "obs4": 18, "obs_kei": 18, "obs_shap": 178, "obs_space_dim": 177, "obs_t": 9, "obs_tp": 9, "obs_tp1": 9, "observ": [2, 3, 4, 5, 6, 9, 10, 11, 12, 13, 15, 17, 19, 20, 148, 155, 156, 157, 160, 162, 163, 166, 167, 173, 175, 177], "observation_mod": [11, 12], "observation_spac": [2, 5, 6, 7, 9, 10, 11, 12, 13, 14, 15, 18, 158, 159, 165, 167, 173, 175, 177], "observation_structur": [137, 138, 139, 140, 141, 143, 146, 147], "observationwrapp": [14, 15, 18, 165, 169], "obstacl": 159, "obstructview": 156, "obstyp": [2, 3, 9, 10, 11, 12, 14, 15, 16, 17, 18, 19, 156, 177], "obswrapp": 155, "obtain": [15, 17, 135, 150, 166], "obviou": 166, "obvious": 156, "occur": [2, 10, 131, 132, 165, 178], "octob": 136, "odyse": 169, "off": [17, 128, 129, 151, 152, 154, 155, 156, 158, 159, 173, 175], "offer": 148, "offici": 3, "offlin": [148, 156], "offscreen": [155, 156], "offset": [129, 140, 141], "offworld": 148, "often": [2, 5, 148, 156, 163, 165, 175], "oftentim": 165, "old": [10, 16, 136, 155, 156, 157], "old_epsilon": 163, "old_po": 159, "old_spac": 14, "old_throughput": 9, "older": [136, 156, 160], "oldv21env": 160, "oldv26env": 160, "oleg": [126, 127, 128, 129], "olimoyo": 155, "olipinski": [155, 156], "omar": 156, "omega_1": 142, "omega_2": 142, "omesa": 136, "omg": 148, "omit": [137, 138, 139, 140, 141, 146, 147], "omniisaacgymenv": 148, "omnivers": 148, "onc": [1, 17, 154, 155, 159, 160, 163, 165, 174, 178], "one": [2, 5, 6, 7, 8, 9, 11, 15, 16, 131, 132, 133, 134, 135, 136, 137, 139, 142, 143, 146, 150, 154, 155, 156, 159, 161, 163, 166, 167, 169, 174, 175, 177, 178], "oneof": [5, 6, 8, 13, 156], "ones": [14, 130, 155, 163, 174, 178], "ongo": 178, "onli": [2, 4, 5, 6, 7, 8, 9, 10, 17, 18, 131, 132, 133, 134, 137, 138, 139, 140, 141, 142, 143, 145, 146, 147, 154, 155, 156, 159, 160, 161, 165, 167, 169, 173, 174, 175, 178], "onlin": [140, 141, 150, 151, 152, 160], "onward": 166, "op": [17, 156], "open": [1, 17, 136, 148, 155, 156, 158, 165], "openai": [2, 19, 126, 155, 156, 157, 166, 174, 177], "opencv": [14, 17, 18, 20, 155], "opengl": [136, 156], "openmodelica": 148, "oper": [8, 14, 136, 148, 155], "oppon": 159, "opportun": 148, "opt": 169, "optim": [13, 14, 17, 127, 129, 140, 141, 148, 156, 158, 159, 160, 163, 174, 175, 177, 178], "optimis": [10, 148, 155, 171], "optimist": 163, "option": [2, 3, 4, 5, 6, 7, 10, 11, 12, 14, 15, 18, 128, 131, 132, 133, 134, 135, 136, 148, 155, 156, 158, 159, 160, 165], "ord": [9, 159, 165], "order": [4, 5, 6, 15, 17, 129, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 155, 156, 158, 162, 165, 175], "order_enforc": [4, 165], "ordereddict": 156, "orderenforc": [4, 15, 17, 20, 127, 128, 129, 131, 132, 133, 134, 135, 155, 156, 158, 159, 165], "orderli": 155, "org": [10, 11, 12, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 156, 174, 177, 178], "orient": [129, 137, 140, 141], "origin": [8, 10, 14, 16, 17, 18, 128, 131, 132, 136, 142, 155, 156, 158, 159, 160, 163, 169], "orsini": 155, "osmesa": 136, "other": [14, 16, 20, 129, 135, 136, 138, 140, 142, 146, 147, 153, 154, 155, 156, 158, 160, 161, 163, 165, 167, 169, 171, 174, 175, 177, 178], "otherwis": [2, 4, 6, 7, 9, 11, 12, 14, 17, 18, 139, 155, 156, 159, 174, 175], "our": [156, 158, 159, 160, 163, 165, 169, 174, 175, 178], "out": [2, 3, 13, 14, 15, 148, 155, 156, 165, 166, 167, 171, 177], "outcom": [150, 175], "outer": 131, "outermost": 14, "outlin": [150, 155, 158, 159, 163, 174], "output": [1, 9, 10, 13, 14, 17, 155, 156, 158, 159, 165, 174, 177, 178], "output_truncation_bool": 9, "outsid": [2, 14, 18, 128, 129, 155, 156, 159, 166], "outweigh": 156, "over": [5, 9, 13, 17, 138, 140, 150, 153, 155, 156, 158, 161, 163, 167, 169, 173, 174, 178], "overal": 156, "overcom": 175, "overfit": [169, 178], "overflow": 156, "overhaul": 156, "overhead": 129, "overrid": [4, 11, 14, 156, 167], "overview": 177, "overwrit": [16, 18, 19], "overwritten": [15, 155, 156], "own": [11, 15, 148, 156, 158, 160, 161, 163, 167, 168, 169, 170], "p": [138, 148, 151, 152, 153, 154, 155, 175, 178], "p_": [144, 145], "p_0": 148, "pace": 148, "packag": [1, 10, 17, 126, 136, 148, 155, 156, 159, 175], "package_data": 155, "pad": [18, 129, 156], "padding_typ": [18, 156], "page": [16, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 151, 152, 156, 158, 159, 160, 162, 163, 171], "painlessli": 5, "pair": [136, 140, 141, 163], "palett": 177, "pan": 144, "panda": [148, 175, 177], "paper": [131, 142, 148, 156, 161, 162], "paradigm": 2, "parallel": [10, 11, 12, 14, 148, 156, 159, 161, 162, 178], "param": [3, 7, 9, 156, 175], "paramet": [2, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 129, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 155, 156, 158, 159, 160, 163, 165, 167, 173, 177, 178], "parameter": [2, 177, 178], "parameter_tun": 155, "parametr": [5, 177], "parent": [13, 173], "pars": 4, "parse_env_id": 4, "parser": 156, "part": [17, 127, 128, 129, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 150, 151, 152, 153, 154, 155, 156, 159, 166, 169, 175], "parti": [136, 137, 138, 139, 140, 141, 143, 146, 147, 155, 156, 165], "partial": [2, 148, 155, 156, 159], "particular": [5, 6, 9, 10, 20, 129, 156, 158, 162, 166, 169, 175], "particularli": [9, 17, 18, 132, 156, 159], "pass": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 14, 15, 16, 17, 18, 19, 20, 128, 137, 138, 139, 140, 141, 146, 147, 155, 156, 158, 159, 160, 165, 167, 178], "passeng": [154, 173], "passenger_loc": 154, "passidx": 154, "passiv": [17, 20, 155, 156], "passiveenvcheck": [4, 15, 17, 20, 127, 128, 129, 131, 132, 133, 134, 135, 156, 158, 159], "past": [14, 18, 19, 155], "patch": [155, 174], "path": [4, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 153, 156, 159, 161, 165, 173, 178], "pathlib": 173, "patienc": [155, 163], "pattern": [160, 161], "paulmest": 156, "paw": 138, "pcg64": 155, "pd": [175, 177], "pdf": [131, 150, 151, 152], "peg": 155, "pelvi": [140, 141], "penal": [137, 138, 139, 140, 141, 142, 144, 145, 146, 147, 167], "penalis": [133, 134], "penalti": [154, 159], "pend": [11, 155], "pendulum": [11, 12, 18, 130, 131, 132, 136, 155, 158, 177], "pendulumenv": 135, "per": [7, 9, 10, 17, 129, 132, 154, 155, 162, 163, 166, 169, 173, 178], "percentag": [128, 174], "peretz": 156, "perez": 156, "perf_count": 155, "perfect": [158, 159, 163], "perfectli": 165, "perform": [2, 5, 14, 17, 145, 155, 156, 158, 161, 162, 163, 169, 173, 177], "period": 139, "perman": [144, 145], "permiss": [155, 156], "perpendicular": [151, 152, 153, 175], "perpendicularli": 142, "person": 131, "perspect": 148, "perturb": [137, 138, 139, 140, 141, 142, 143, 146, 147], "pet": 158, "pettingzoo": [2, 148, 155], "pge": 148, "phase": [148, 159, 178], "phd": [133, 134, 146], "philosoph": 9, "photorealist": 148, "phys2d": 17, "physic": [2, 126, 136, 142, 143, 144, 145, 148, 155, 156, 159, 177], "pi": [129, 131, 133, 135], "pick": [154, 163, 169, 173, 174, 175, 178], "pickl": [1, 13, 155, 156], "pickled_env_spec": 156, "pickup": [154, 173], "pictur": [158, 161], "piec": 165, "pierrecounath": 156, "pierremardon": 156, "pierr\u00e9": [156, 175], "pinocchio": 148, "pip": [1, 126, 130, 136, 155, 156, 158, 160, 165, 169], "pip3": 155, "pipe": [11, 155], "pipx": 165, "pirata": 155, "pitfal": 127, "pix_square_s": 165, "pixel": [2, 18, 128, 148, 158, 160, 165], "pixelobservationwrapp": [18, 155, 156], "pixelobswrapp": 155, "pixels3d": 165, "pkuderov": 156, "place": [9, 17, 132, 133, 134, 156, 159, 165, 178], "plai": [9, 128, 148, 155, 156, 158, 159, 163, 174], "plan": [148, 155, 156, 159], "plateau": 163, "platform": 148, "playablegam": 9, "player": [148, 150, 151, 152, 153, 154, 163, 174, 175], "player_count": 174, "player_sum": 163, "playfield": 128, "playplot": [9, 156], "pleas": [2, 5, 7, 18, 136, 148, 155, 156, 159, 163, 171], "plot": [1, 9, 161, 163, 173, 174, 175], "plot_nam": 9, "plot_q_values_map": 175, "plot_states_actions_distribut": 175, "plot_steps_and_reward": 175, "plot_surfac": 174, "plotter": 9, "plt": [161, 163, 173, 174, 175, 177, 178], "plu": [7, 151, 152, 156, 161, 163], "plugin": [155, 156], "pm": 129, "png": [169, 173], "point": [4, 8, 9, 15, 127, 128, 129, 131, 132, 135, 136, 145, 150, 155, 156, 159, 166], "pointless": 156, "pole": [2, 130, 136, 142, 143, 148, 158, 177], "pole2": 142, "pole_angl": 158, "pole_angular_veloc": 158, "poli": 148, "polici": [2, 14, 18, 19, 130, 136, 137, 138, 139, 140, 141, 146, 147, 148, 155, 156, 157, 158, 161, 163, 166, 169, 175, 178], "policy_grid": 174, "policy_mean_net": 177, "policy_network": 177, "policy_stddev_net": 177, "polygon": 155, "pomdp": 3, "pong": [17, 156, 160], "pontryagin": 129, "pool": [17, 146], "poorli": 159, "pop": [2, 155, 156], "pop_fram": 17, "popular": [14, 17, 126, 148, 156, 163, 174], "pose": 148, "posit": [2, 6, 7, 8, 9, 11, 13, 17, 127, 128, 129, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 151, 152, 153, 154, 156, 158, 159, 165, 167, 174], "position_fingertip": 145, "position_target": 145, "possibl": [2, 5, 6, 7, 8, 14, 16, 17, 129, 131, 132, 133, 134, 136, 138, 140, 143, 146, 151, 152, 153, 154, 155, 156, 158, 159, 161, 163, 165, 169, 173, 174, 175], "possibli": [7, 13, 15, 17, 159, 178], "post": [155, 156, 160, 175], "postprocess": 175, "potenti": 156, "pow": 178, "power": [17, 128, 129, 134, 142, 143, 148, 177], "pp": 154, "ppo": 171, "pprint": [14, 156], "pprint_registri": [2, 4, 156, 158, 159], "pr": [140, 148, 155, 156], "practic": [148, 155, 158, 160, 163, 166, 173, 174], "practition": 161, "pre": [4, 5, 153, 156, 165], "precis": [6, 155], "predefin": 165, "predict": [139, 148, 163, 177, 178], "predominantli": 3, "prefix": 161, "preload": 153, "premad": 148, "prematur": 2, "prepend": [9, 17], "preprocess": [9, 17, 20, 155, 156], "present": [131, 148, 155, 161, 166, 174], "preserv": [160, 166], "press": [7, 9, 128, 131, 158], "pressur": 159, "pretti": [4, 156, 175], "prevent": [3, 7, 11, 155, 156, 158, 159, 160, 173], "previou": [17, 156, 166, 167], "previous": [4, 9, 18, 137, 138, 139, 140, 141, 143, 146, 147, 155, 156], "primarili": [148, 156], "primaryclass": 156, "principl": 129, "print": [4, 156, 158, 159, 161, 163, 165, 167, 169, 173, 175, 177, 178], "print_registri": 4, "prior": 4, "priori": 148, "privat": 165, "prng": [2, 5, 6, 7], "proabil": [151, 152], "prob": [177, 178], "proba_frozen": 175, "probabl": [5, 6, 7, 16, 20, 151, 152, 153, 154, 156, 160, 163, 166, 174, 175, 177, 178], "problem": [17, 129, 132, 135, 137, 140, 141, 142, 143, 146, 148, 150, 154, 156, 157, 158, 160, 162, 163, 166, 169, 173, 178], "procedur": 177, "proceed": 131, "process": [9, 10, 11, 13, 14, 18, 131, 148, 156, 158, 165, 166, 178], "process_ev": 9, "produc": [2, 17, 20, 155, 156, 165], "product": [6, 7, 177], "program": [10, 11, 12, 148, 156], "progress": [6, 9, 156, 159, 161, 163, 178], "project": [9, 148, 155, 156, 159, 160, 161, 165, 174], "prompt": 156, "propag": 175, "proper": [155, 158], "properli": [1, 5, 155, 158, 159, 160, 169], "properti": [2, 5, 10, 11, 12, 14, 15, 18, 19, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 155, 156, 166], "proport": 178, "propos": [16, 156], "protocol": 17, "prototyp": 148, "prove": 148, "prover": 148, "provid": [2, 5, 6, 7, 9, 10, 11, 14, 16, 17, 18, 20, 126, 127, 131, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 155, 156, 158, 159, 160, 161, 162, 163, 165, 171, 173, 174], "psc": 155, "pseudo": [155, 156, 178], "pseudorandom": [5, 7], "publicli": 156, "publish": 156, "pull": [18, 19, 155], "pump": 165, "pure": 163, "purpos": [3, 5, 155, 160, 161], "push": [129, 132, 136, 142, 143, 148, 156, 158, 177], "pusher": [136, 156], "pusher_v5": 144, "put": [155, 165, 175], "puzzl": 148, "py": [1, 9, 126, 127, 128, 129, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 151, 152, 155, 156, 165, 166, 167, 169, 173, 174, 175, 177, 178], "pybullet": 148, "pycharm": 156, "pydoc": 155, "pyflyt": [148, 156], "pygam": [2, 9, 126, 155, 156, 165], "pyglet": 155, "pypi": [155, 156], "pyplot": [161, 163, 173, 174, 175, 177, 178], "pyproject": 165, "pyright": [2, 155, 156], "pystk2": 148, "python": [1, 17, 126, 127, 128, 129, 148, 155, 156, 157, 158, 159, 160, 165, 166, 167, 169, 170, 171, 173, 174, 175, 177, 178], "pytorch": [14, 17, 20, 156, 162, 171, 177], "q": [154, 161, 166, 170, 171, 173, 176, 178], "q_": 166, "q_tabl": 173, "q_target": 166, "q_updat": 175, "q_valu": [154, 163, 174], "qfrc_actuat": [140, 141], "qfrc_constraint": 142, "qgallouedec": 156, "qlearn": 175, "qpo": [136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147], "qtabl": 175, "qtable_best_act": 175, "qtable_direct": 175, "qtable_directions_map": 175, "qtable_val_max": 175, "quad": 141, "quad_ctrl_cost": 141, "quad_impact_cost": 141, "quadcopt": 148, "quadrotor": 148, "quadrup": [136, 137, 156, 168, 170], "quagla": 155, "qualiti": [10, 148, 156], "quaternion": [137, 140, 141], "queen": 150, "question": [148, 160, 165], "queue": [11, 161], "quicker": 178, "quickli": [133, 148, 163, 174, 175], "quit": [11, 156, 165], "qvel": [136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147], "qwop": 148, "r": [1, 7, 14, 17, 19, 131, 135, 148, 150, 151, 152, 154, 161, 167, 169, 173, 175, 177], "r_": 178, "r_elbow_flex_joint": 144, "r_forearm_roll_joint": 144, "r_shoulder_lift_joint": 144, "r_shoulder_pan_joint": 144, "r_t": 166, "r_upper_arm_roll_joint": 144, "r_wrist_flex_joint": 144, "r_wrist_roll_joint": 144, "race": [126, 148, 155], "racecar": 148, "racecar_gym": 148, "racing_dream": 148, "rad": [131, 132, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147], "radian": [129, 131, 132, 135, 143], "rafaelcp": 156, "raghuspacerajan": 155, "rainbow": [171, 177], "raini": 156, "rais": [2, 4, 7, 8, 9, 11, 12, 13, 15, 17, 18, 132, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 155, 156, 178], "ram": 162, "rand": 155, "randint": [155, 173], "randn": 155, "random": [2, 3, 4, 5, 6, 7, 9, 10, 11, 12, 17, 18, 128, 129, 131, 132, 133, 134, 135, 137, 138, 139, 140, 141, 142, 143, 145, 146, 147, 153, 154, 155, 156, 158, 159, 161, 163, 165, 173, 174, 175, 177], "randomize_domain": 178, "randomize_ob": 128, "randomli": [5, 6, 9, 129, 153, 155, 156, 158, 159, 163, 165, 175, 178], "randomnumbergener": 155, "randomst": 155, "rang": [7, 9, 13, 14, 16, 17, 18, 20, 127, 130, 131, 132, 133, 134, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 150, 151, 152, 153, 154, 155, 156, 157, 158, 159, 160, 161, 163, 165, 167, 169, 170, 172, 173, 174, 175, 176, 177, 178], "rangefind": 127, "raphajan": 156, "rapidli": 148, "rare": [7, 155], "rate": [144, 145, 148, 161, 163, 174, 175, 177, 178], "rather": [2, 4, 6, 128, 155, 156, 161, 174, 178], "raw": [156, 159, 161, 169], "rayerdyn": 156, "rcparam": 177, "rdnfn": 155, "re": [1, 155, 156, 158, 160, 161, 163, 165, 173, 175, 177], "reach": [2, 4, 17, 18, 20, 130, 131, 132, 133, 134, 136, 148, 151, 152, 153, 154, 156, 159, 160, 165, 166, 171, 174, 175, 177], "reachabl": 154, "reacher": [136, 156, 167], "reacher_weighted_reward": 165, "reacherrewardwrapp": 167, "read": [2, 5, 10, 13, 19, 131, 137, 140, 141, 155, 156, 159, 163], "read_from_shared_memori": [5, 13], "readabl": [5, 6, 156, 159], "reader": [162, 169], "readi": [158, 169, 174], "readm": [155, 156, 165], "readthedoc": 18, "real": [9, 138, 148, 158, 173], "realist": [136, 148], "realli": [156, 159, 169, 174], "rear": 128, "reason": [2, 17, 129, 148, 155, 156, 159, 160, 169], "rebuild": 1, "receiv": [9, 18, 19, 20, 128, 129, 134, 147, 154, 155, 157, 158, 163, 166, 174, 177, 178], "recent": [13, 14, 17, 18, 19, 156, 161], "recent_reward": 161, "recogn": 156, "recommend": [3, 4, 9, 11, 17, 129, 136, 137, 140, 141, 155, 156, 159, 169, 174, 178], "reconstruct": 158, "record": [4, 9, 17, 20, 127, 148, 155, 156, 158, 160, 163, 177, 178], "recordconstructorutil": 156, "recorded_fram": 156, "recordepisodestat": 155, "recordepisodestatist": [14, 17, 20, 155, 156, 161, 163, 174, 177, 178], "recordvideo": [17, 20, 155, 156, 161], "recordvideov0": 156, "recreat": 156, "recreated_env": 156, "rect": 165, "red": [154, 155, 165, 173], "redirect": [21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125], "redtachyon": [155, 156], "reduc": [132, 148, 162, 163, 171, 173, 174, 178], "redund": 155, "refactor": [155, 156], "refer": [2, 4, 5, 7, 9, 136, 156, 157, 162, 165, 166, 169], "referenc": 156, "reflect": [18, 132, 155, 156], "refresh": 175, "regard": 130, "regardless": [137, 138, 139, 140, 141, 146, 147, 169], "regex": 4, "reginald": 156, "regist": [13, 155, 156], "register_env": [17, 156, 160], "registr": [4, 155, 156, 165], "registri": [4, 155, 156], "regress": [9, 156], "regularli": 156, "reinforc": [2, 5, 131, 146, 148, 149, 150, 151, 152, 154, 155, 156, 157, 162, 166, 170, 171, 173, 174, 175, 176, 178], "reiniti": [155, 177], "rel": [131, 140, 141, 156, 165, 167, 178], "relat": [129, 132, 137, 139, 140, 141, 142, 143, 144, 145, 147, 148, 156, 177], "relative_posit": 165, "relativeposit": [165, 167], "releas": [10, 11, 12, 131, 132, 133, 134, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 150, 151, 152, 153, 154, 165], "relev": [155, 165], "reli": 136, "reliabl": 163, "relu": [14, 178], "remain": [18, 151, 152, 155, 160, 165, 166], "remak": 178, "rememb": [17, 128, 163, 165, 167], "remind": [156, 169, 173], "remot": [148, 156], "remov": [2, 4, 17, 18, 137, 138, 139, 140, 141, 145, 146, 147, 154, 155, 156], "renam": [14, 17, 18, 138, 140, 155, 156, 177], "render": [2, 3, 4, 10, 14, 15, 17, 18, 20, 126, 127, 137, 138, 139, 140, 146, 147, 148, 155, 156, 158, 161, 167, 174, 175], "render_clos": 3, "render_fp": [2, 9, 17, 156, 165], "render_imag": 3, "render_init": 3, "render_kei": 18, "render_mod": [2, 3, 9, 10, 15, 17, 18, 127, 128, 131, 132, 133, 134, 135, 136, 155, 156, 157, 158, 159, 160, 161, 165, 169, 175, 178], "render_onli": 18, "render_st": 3, "rendercollect": [2, 17, 20, 156], "renderedfram": [17, 20], "renderfram": [2, 9, 10, 14, 15], "renderstatetyp": 3, "renorm": 129, "rep": 175, "repeat": [4, 16, 18, 20, 156, 158, 159, 163, 175], "repeat_action_dur": 16, "repeat_action_prob": 16, "repeatedli": 158, "rephras": 155, "replac": [17, 18, 137, 146, 150, 155, 156, 158, 161, 163, 165, 169, 174], "replay_buff": 156, "repo": [1, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 155, 156], "report": [127, 137, 140, 141, 155, 156, 160], "repositori": [136, 155, 171], "repres": [2, 6, 7, 9, 18, 129, 131, 134, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 151, 152, 153, 154, 155, 156, 157, 158, 159, 165, 169, 175, 177], "represent": [2, 156, 166], "reproduc": [2, 6, 148, 156, 159, 160, 173, 175], "request": [18, 150, 156], "requir": [1, 2, 5, 6, 9, 11, 14, 18, 136, 147, 155, 156, 159, 162, 163, 165, 169, 174, 177, 178], "rerun": 156, "res_al": 175, "rescal": [14, 16, 18, 20, 158], "rescale_act": 155, "rescaleact": [14, 15, 16, 20, 156, 158], "rescaleobserv": [14, 18, 20, 156], "research": [136, 142, 148, 154, 156, 160, 162], "reseed_sampl": 156, "reseed_valu": 156, "reset": [2, 3, 4, 9, 10, 11, 12, 14, 15, 16, 17, 18, 19, 20, 129, 131, 132, 133, 134, 135, 137, 138, 139, 140, 141, 142, 143, 146, 147, 151, 152, 153, 154, 155, 156, 157, 158, 161, 163, 169, 173, 174, 175, 177, 178], "reset_async": 156, "reset_clean": 17, "reset_noise_scal": [137, 138, 139, 140, 141, 142, 143, 146, 147, 169], "reset_qt": 175, "reset_wait": 156, "resetneed": 17, "reshap": [14, 18, 20, 175], "reshape_env": 18, "reshapeobserv": [14, 18, 20], "resiz": [14, 17, 18, 20, 156], "resized_env": 18, "resizeobserv": [14, 18, 20, 156], "resolv": 155, "resourc": [10, 11, 12, 159, 160, 165, 174], "respect": [14, 15, 17, 129, 131, 137, 138, 139, 140, 141, 146, 147, 155, 156, 158, 167, 178], "respectivesli": 14, "respond": [158, 174], "rest": [128, 129, 139, 147, 156, 159, 178], "restart": 158, "restor": [137, 138, 139, 140, 141, 146, 147, 163], "restrict": 156, "result": [2, 6, 8, 11, 12, 13, 17, 129, 131, 132, 136, 137, 140, 141, 142, 145, 149, 151, 152, 154, 155, 156, 158, 159, 160, 161, 174, 175, 178], "retriev": 4, "retro": [148, 156], "return": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 127, 136, 137, 138, 139, 140, 141, 145, 146, 147, 150, 151, 152, 153, 154, 155, 156, 158, 159, 160, 163, 165, 166, 167, 173, 174, 175, 177, 178], "return_info": [2, 155], "return_queu": [14, 17, 161, 163, 174, 177, 178], "reveal": [150, 161], "revers": [5, 8, 150, 177, 178], "revert": [155, 156], "revisit": 17, "rew": [9, 14, 17, 19, 166], "reward": [2, 3, 4, 9, 10, 11, 12, 15, 17, 18, 20, 148, 155, 156, 157, 158, 160, 161, 163, 165, 166, 167, 173, 174, 175, 177, 178], "reward_al": 140, "reward_control": [144, 145], "reward_control_weight": [144, 145], "reward_ctrl": [14, 137, 139, 140, 144, 145, 147, 167], "reward_ctrl_weight": 167, "reward_dist": [144, 145, 167], "reward_dist_weight": [144, 145, 167], "reward_forward": [137, 138, 139, 140, 146, 147], "reward_fwd": 146, "reward_linvel": 140, "reward_moving_averag": [163, 174], "reward_near": 144, "reward_near_weight": [144, 145], "reward_over_episod": 177, "reward_quadctrl": 140, "reward_rang": 156, "reward_run": [14, 138], "reward_scal": 159, "reward_surv": [137, 139, 140, 142, 143, 147], "reward_threshold": [4, 137, 138, 139, 140, 141, 144, 145, 146, 147, 156, 165], "rewards_df": 175, "rewards_over_se": 177, "rewardtyp": [3, 156], "rewardwrapp": [14, 15, 19, 169], "rewrit": [155, 156], "rgb": [2, 14, 17, 18, 20, 128, 137, 138, 139, 140, 146, 147, 155, 156, 158], "rgb_arrai": [2, 3, 9, 17, 18, 20, 127, 128, 131, 132, 133, 134, 135, 136, 155, 156, 158, 160, 161, 165, 169, 175, 178], "rgb_array_list": [2, 9, 17, 155], "rgbd": 156, "rgbd_tupl": 136, "richard": 175, "ride": [158, 163], "right": [2, 7, 127, 128, 129, 132, 133, 134, 135, 137, 138, 139, 140, 141, 142, 143, 146, 147, 151, 152, 153, 154, 156, 158, 159, 163, 165, 173, 174, 175, 177], "right_back_leg": 137, "right_elbow": [140, 141], "right_foot": [140, 141], "right_hip_i": [140, 141], "right_hip_x": [140, 141], "right_hip_z": [140, 141], "right_kne": [140, 141], "right_lower_arm": [140, 141], "right_shoulder1": [140, 141], "right_shoulder2": [140, 141], "right_sin": [140, 141], "right_thigh": [140, 141], "right_upper_arm": [140, 141], "rigid": [140, 141], "risk": 148, "riski": 148, "rl": [9, 17, 148, 156, 157, 159, 160, 161, 163, 166, 169, 170, 172, 174, 176, 177], "rlbook2020": [150, 151, 152], "rmsprop": 178, "rnd": [155, 156], "rng": [2, 3, 5, 6, 7, 9, 10, 155, 156, 165, 175], "road": [128, 156], "roadmap": 156, "robertoschiavon": 156, "robo": 148, "robot": [127, 133, 134, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 155, 156, 158, 160, 166, 168, 170], "robust": [148, 173, 178], "rocket": [129, 148], "rodrigo": 156, "rodrigodelazcano": [155, 156], "rogerjl": 156, "rohan138": 155, "roll": [18, 20, 144, 174], "rolling_length": [163, 174, 178], "rollout": [154, 156], "rom": [155, 156], "ronald": 177, "root": [6, 137, 140, 141, 156], "rooti": [138, 139, 147], "rootx": [138, 139, 147], "rootz": [138, 139, 147], "rotat": [129, 131, 137, 140, 141, 144, 155, 174], "rotor": [137, 138, 139, 140, 141, 146, 147], "roughli": 136, "roulett": 155, "roundtrip": 17, "row": [151, 152, 153, 159, 163, 175], "rpg": 153, "rr": 156, "rstride": 174, "rule": [148, 150, 159, 163, 174], "run": [1, 2, 4, 10, 11, 12, 14, 17, 18, 19, 127, 129, 131, 136, 137, 138, 139, 140, 146, 147, 148, 151, 152, 155, 156, 158, 160, 161, 162, 165, 169, 178], "run_": 1, "run_env": 175, "run_gymnasium_env": 165, "runner": 136, "running_g": 177, "runningmeanstd": [14, 18, 19], "runtim": 178, "runtimeerror": [11, 12, 178], "rushivarora": 155, "rusu24edward": [155, 156], "ryanrud": 155, "r\u00e9mi": 146, "s_": 178, "sab": [150, 163, 174], "safe": [129, 148, 156, 158], "safeti": [148, 155, 156, 159], "sai": [17, 155, 163, 167], "said": [3, 140], "same": [4, 5, 6, 8, 9, 10, 11, 12, 13, 14, 16, 18, 20, 127, 128, 131, 136, 137, 138, 139, 140, 141, 142, 144, 145, 146, 147, 154, 155, 156, 159, 160, 162, 163, 166, 169, 174, 178], "sampl": [2, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 17, 18, 19, 129, 144, 154, 155, 156, 157, 158, 160, 161, 162, 163, 165, 169, 174, 175, 177, 178], "sample_act": 177, "sample_mask": 6, "sample_n": 5, "sample_phas": 178, "samplefactori": 156, "sander": 156, "saniti": 175, "sarsa": 163, "sashashura": [155, 156], "satisfi": 2, "satur": 148, "save": [14, 17, 155, 156, 158, 161, 163, 167, 173, 175], "save_logg": 9, "save_video": [9, 155], "save_videos1": 17, "save_videos2": 17, "save_videos3": 17, "save_weight": 178, "savefig": 173, "savefig_fold": 173, "sb3": 155, "scalabl": 148, "scalar": [7, 14, 16, 155], "scale": [14, 17, 18, 19, 129, 137, 138, 139, 140, 141, 142, 143, 146, 147, 148, 156, 162, 178], "scale_and_shift": 14, "scale_ob": 17, "scenario": [128, 148, 161, 173], "scene": [2, 148, 156, 169], "sched": 148, "schedul": [9, 148, 153], "scheme": 128, "schulhoff": 156, "schulman": [137, 178], "scienc": 163, "scope": [2, 166], "score": [127, 129, 158, 159], "scoreboard": 155, "scratch": [177, 178], "screen": [17, 137, 138, 139, 140, 146, 147, 155, 156, 158], "screen_siz": 17, "script": [1, 148, 161, 174], "sdl": 156, "seaborn": [174, 175, 177], "search": 156, "sebastian": 156, "second": [1, 6, 9, 10, 17, 129, 132, 142, 145, 146, 148, 156, 161, 162, 169], "section": [16, 128, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 156, 160, 165, 174, 175], "see": [1, 2, 5, 6, 9, 10, 11, 12, 17, 128, 129, 131, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 151, 152, 153, 155, 156, 158, 159, 160, 161, 163, 165, 169, 175, 178], "seed": [2, 3, 4, 5, 6, 7, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 131, 132, 133, 134, 135, 136, 155, 156, 157, 158, 159, 161, 165, 173, 175, 177, 178], "seeded_valu": 156, "seem": [158, 175], "seen": [131, 159], "segment": 146, "select": [5, 7, 9, 136, 156, 158, 169, 173, 178], "select_act": 178, "self": [5, 6, 7, 9, 14, 18, 19, 134, 148, 156, 159, 163, 165, 167, 174, 175, 177, 178], "semant": 155, "send": 14, "sens": [7, 159, 169, 175], "sensor": [128, 169], "sent": 155, "separ": [5, 17, 156, 159, 160, 165, 178], "sepsi": 148, "sequenc": [2, 4, 5, 6, 7, 8, 11, 12, 13, 14, 18, 148, 155, 156, 158, 159], "sequenti": [161, 177, 178], "seri": [6, 158], "serial": [12, 178], "serv": [3, 5, 137, 138, 139, 140, 141, 146, 147, 161], "server": 156, "set": [2, 4, 5, 6, 7, 9, 10, 11, 12, 15, 16, 17, 18, 20, 126, 129, 130, 131, 133, 134, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 153, 155, 156, 159, 160, 161, 165, 166, 167, 169, 171, 173, 174, 175, 177, 178], "set_attr": [11, 12, 156], "set_color": 175, "set_linewidth": 175, "set_mod": 165, "set_np_random_through_se": [2, 10], "set_rotate_label": 174, "set_stat": 155, "set_them": 175, "set_titl": [163, 174, 175, 178], "set_vis": 175, "set_wrapper_attr": [15, 156], "set_xlabel": [163, 174, 178], "set_xtick": 175, "set_xticklabel": 174, "set_ylabel": [163, 174], "set_yticklabel": 174, "set_zlabel": 174, "setup": [155, 161, 173], "seungjaeryanle": 155, "seven": 147, "sever": [2, 4, 7, 10, 17, 129, 155, 156, 158, 159, 161, 173, 175], "sfff": 153, "sfffffff": 153, "shape": [2, 5, 6, 7, 8, 10, 11, 13, 14, 16, 17, 18, 20, 131, 132, 133, 134, 135, 137, 140, 141, 150, 151, 152, 153, 154, 155, 156, 158, 159, 165, 167, 175, 177, 178], "share": [5, 11, 156, 161, 177], "shared_featur": 177, "shared_memori": [11, 13], "shared_net": 177, "sheet": 163, "shen": 156, "shift": 7, "shimmi": [156, 160], "shin": [138, 140, 141], "shinrl": 148, "shoot": 11, "short": [136, 155, 160, 163], "shorthand": 155, "should": [1, 2, 5, 7, 9, 10, 11, 12, 13, 14, 17, 136, 145, 155, 156, 158, 159, 162, 163, 165, 166, 167, 169, 174, 178], "shoulder": 144, "shouldn": [156, 159, 165], "show": [3, 136, 150, 155, 156, 158, 160, 161, 163, 165, 167, 169, 170, 172, 173, 174, 175, 176, 177, 178], "showcas": [164, 168, 170, 174], "shown": [128, 131, 166], "shrink_act": 14, "siddarth": [156, 177], "side": [13, 129, 175], "sign": [142, 143, 177], "signal": [2, 17, 137, 139, 140, 147, 154, 158, 165, 166, 175], "signific": [148, 156, 160, 161, 169], "significantli": [155, 156, 173, 178], "silenc": 9, "silent": 156, "silver": [175, 178], "sim": [148, 175], "similar": [6, 10, 144, 155, 156, 159, 165], "similarli": [129, 156], "simlat": 136, "simonini": 175, "simoninithoma": 175, "simpl": [127, 148, 149, 157, 158, 160, 161, 163, 166, 177], "simplegrid": 148, "simpler": 158, "simplest": 178, "simpli": [14, 16, 17, 18, 19, 165], "simplic": 148, "simplifi": [135, 155, 156], "simplist": 165, "simul": [2, 136, 140, 141, 142, 143, 148, 156, 159, 174, 175, 177], "simultan": [156, 159], "sin": [129, 135, 142, 145], "sinc": [5, 14, 17, 126, 132, 141, 145, 154, 155, 156, 159, 165, 166, 169, 175], "sine": [131, 142, 145], "singl": [2, 3, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 18, 20, 139, 147, 148, 155, 156, 158, 159, 160, 162, 165, 174, 177], "single_action_spac": [10, 13, 14, 156, 178], "single_func": 14, "single_observation_spac": [10, 11, 14, 156, 178], "single_rgb_arrai": 155, "sinusoid": [133, 134], "site": 155, "situat": [154, 158, 163], "six": 147, "size": [5, 13, 14, 17, 148, 153, 155, 156, 159, 165, 169], "sjmikler": 156, "skeleton": 165, "skill": [159, 161], "skip": [9, 17, 18, 20, 155, 156, 160, 165], "skip_and_max_ob": 18, "skip_close_check": 9, "skip_render_check": 9, "sleep": 129, "slide": [138, 139, 142, 143, 144, 145, 146, 147], "slider": [142, 143], "slider1": 146, "slider2": 146, "slight": 127, "slightli": [9, 127, 136, 137, 140, 141, 142, 145, 163], "slime": 148, "slimevolleygym": 148, "slipperi": [151, 153], "slow": [156, 174], "slowdown": 9, "slower": [129, 163, 178], "small": [127, 148, 149, 155, 156, 159, 163, 177], "smallest": 7, "smart": 148, "smarter": 158, "smooth": [161, 163], "smoother": [155, 174], "sn": [174, 175, 177], "snake_cas": 1, "snippet": [9, 17], "snow": 153, "so": [1, 9, 11, 14, 17, 18, 20, 129, 130, 137, 138, 139, 140, 141, 144, 145, 146, 147, 151, 152, 153, 155, 156, 159, 161, 163, 165, 166, 167, 169, 174, 175, 178], "soft": 148, "softmax": 178, "softrobot": 148, "softwar": [2, 148, 156], "sokoban": 148, "sole": [155, 156], "solut": [129, 156, 174], "solv": [2, 127, 130, 132, 136, 142, 143, 148, 159, 160, 163, 165, 170, 176, 177], "some": [2, 5, 6, 7, 10, 11, 12, 14, 15, 128, 130, 131, 145, 146, 154, 155, 156, 158, 160, 161, 163, 165, 167, 169, 174, 175, 178], "someth": [155, 156, 169], "sometim": [9, 137, 151, 152, 153, 158, 159, 161, 165, 167], "sonelu": 156, "soon": [155, 165], "sophist": [159, 161], "sort": 7, "sourc": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 136, 148, 154, 155, 156, 165, 166, 167, 169, 170, 173, 174, 175, 177, 178], "south": [154, 173], "space": [2, 9, 10, 11, 12, 14, 15, 16, 17, 18, 20, 136, 148, 149, 155, 156, 163, 165, 167, 175, 177, 178], "spacecraft": 148, "spaces_kwarg": 6, "span": 17, "sparisi": 156, "spark": 148, "spars": [131, 159, 165], "spatial": 159, "spawn": [11, 145, 178], "spec": [2, 3, 4, 10, 15, 17, 156], "special": [156, 177], "specialis": 156, "specialist": 162, "specif": [2, 4, 7, 10, 14, 17, 136, 155, 156, 159, 161, 166, 177, 178], "specifi": [2, 5, 6, 7, 9, 14, 16, 17, 18, 20, 126, 127, 128, 129, 130, 135, 137, 138, 139, 140, 141, 143, 146, 147, 149, 153, 154, 155, 156, 158, 160, 161, 165, 167], "speed": [10, 127, 128, 156, 158, 160, 169, 170, 176], "speedup": 178, "spell": 155, "spent": [127, 129], "sphere": 144, "spheric": 145, "sphinx": 1, "spike": 163, "spine": 175, "spinningup": 177, "split": [147, 156], "squar": [17, 144, 145, 154, 156, 159, 165, 175, 178], "squeez": [177, 178], "st": 175, "st_all": 175, "stabil": [14, 18, 19, 140, 141, 155, 159, 163, 167, 177], "stabl": [18, 148, 155, 156, 163, 165, 171, 173], "stable_baselines3": 18, "stack": [6, 17, 18, 20, 156, 177], "stack_siz": 18, "stacked_env": 18, "stage": [17, 156, 161], "stai": [158, 159, 163, 178], "stand": [127, 136, 137, 139, 140, 141, 142, 143, 147, 156, 163, 174], "standard": [18, 19, 148, 155, 156, 157, 163, 173, 177, 178], "standard_norm": 155, "standup": 136, "stare": 161, "start": [1, 2, 5, 7, 9, 11, 13, 17, 136, 156, 157, 158, 160, 161, 163, 174, 175, 177, 178], "start_epsilon": [163, 174], "state": [2, 3, 4, 17, 18, 20, 130, 136, 148, 149, 155, 156, 158, 160, 163, 166, 169, 173, 174, 175, 177, 178], "state_dict": 178, "state_info": 3, "state_s": 175, "state_valu": [174, 178], "state_value_pr": 178, "statefulli": 3, "stateless": [3, 156], "statement": [156, 160], "statetyp": [3, 156], "stationari": 178, "statist": [9, 14, 17, 18, 19, 129, 156, 161, 173, 177], "stats_kei": [14, 17], "std": [14, 161, 163, 173, 177], "std_reward": [161, 173], "stderr": 155, "steer": [128, 159], "stefanbschneid": 156, "step": [2, 3, 4, 10, 11, 12, 14, 15, 16, 17, 18, 19, 20, 127, 129, 131, 132, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 151, 152, 153, 154, 155, 156, 157, 161, 162, 166, 167, 173, 174, 175, 177, 178], "step_api_compat": 9, "step_async": 156, "step_count": 161, "step_index": 9, "step_info": 3, "step_penalti": 159, "step_return": 9, "step_starting_index": 9, "step_trigg": [9, 17], "step_wait": 156, "stepapicompat": 156, "steppabl": 148, "steps_df": 175, "stick": [150, 174], "sticki": 16, "stickyact": [16, 20, 156], "still": [9, 155, 156, 163, 167, 173, 174, 178], "stochast": [16, 130, 131, 133, 134, 136, 151, 152, 155, 175], "stock": 148, "stool": 153, "stop": [17, 150, 156, 158, 163, 166, 174], "stopiter": 13, "storag": 148, "store": [4, 9, 14, 17, 156, 173, 177], "str": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 17, 18, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 156, 174, 175, 177], "straightforward": 160, "strang": 156, "strateg": [133, 134, 159], "strategi": [148, 158, 159, 160, 162, 174], "strict": [2, 155, 156], "strictli": 17, "striker": 155, "string": [2, 4, 5, 7, 9, 14, 18, 155, 156, 158, 159, 165], "stringio": 2, "stronger": 169, "structur": [3, 5, 6, 8, 156, 158, 159, 165], "struggl": 161, "stump": 127, "style": [2, 4, 10, 148, 155, 156, 160, 177], "sub": [6, 10, 11, 12, 14, 156, 162], "subclass": [14, 155], "subject": 146, "submit": [148, 155], "suboptim": 163, "subplot": [163, 174, 175, 178], "subprocess": 11, "subse": 155, "subsect": 169, "subsequ": [6, 155, 160], "subset": [7, 156, 167], "subspac": [5, 6, 7, 8, 14, 18, 155], "substanti": [156, 162], "subtl": 160, "subtract": 178, "succeed": 158, "success": [131, 154, 156, 158, 159, 160, 161, 166], "successfulli": [2, 154, 158, 163, 169], "suffici": [159, 174], "suggest": [155, 163, 178], "suit": [148, 155], "suitabl": [148, 149], "sum": [6, 7, 17, 129, 150, 156, 161, 174, 175, 177], "summaris": 156, "sumo": 148, "super": [2, 14, 15, 148, 155, 159, 165, 167, 177, 178], "superclass": [5, 16, 19], "supersuit": 156, "supertuxkart": 148, "supervis": 163, "suppli": 166, "support": [2, 5, 6, 8, 9, 10, 17, 18, 20, 137, 138, 139, 140, 141, 143, 146, 147, 148, 155, 156, 158, 159, 165], "supportsfloat": [2, 7, 9, 15, 19, 167, 177], "suppos": 9, "suptitl": [174, 178], "sure": [1, 2, 9, 17, 165, 167, 169], "surfac": [142, 143, 147, 165], "surfarrai": 165, "surround": [17, 20], "survei": 162, "suspend": 146, "sutton": [2, 131, 132, 142, 143, 150, 151, 152, 155, 174, 175], "sutton_barto_reward": [132, 156], "swig": [126, 155, 156], "swim": 136, "swimmer": [136, 147, 155], "swing": [131, 135], "swingup": 135, "switch": [155, 156, 158, 160], "symbol": 148, "symptom": 163, "sync": [4, 9, 10, 12, 14, 132, 156], "synchron": [10, 11, 12, 156], "synchronizedarrai": 13, "syncvectorenv": [4, 10, 132, 156, 159, 162, 178], "syntax": 4, "synthes": 148, "synthesi": [140, 141], "system": [131, 135, 136, 142, 155, 156, 159, 165], "system_check": 6, "systemat": [161, 163], "t": [1, 2, 4, 5, 6, 8, 9, 14, 15, 17, 128, 129, 133, 134, 154, 155, 156, 158, 159, 160, 161, 163, 165, 166, 173, 174, 175, 178], "t_cov": [5, 13], "tabl": [155, 163, 173], "tabular": [148, 163, 170, 176], "tag": 148, "tai": 156, "tailkind": 9, "take": [1, 2, 3, 4, 7, 8, 9, 10, 11, 16, 17, 130, 132, 134, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 154, 155, 158, 159, 163, 167, 173, 174, 175, 177, 178], "taken": [10, 17, 18, 20, 130, 132, 158, 161, 162, 165, 171, 177, 178], "talk": [162, 163, 177], "tall": 137, "tan": 156, "tanh": [129, 177], "target": [18, 131, 136, 144, 145, 154, 159, 160, 163, 165, 166, 167, 178], "target_devic": [14, 17], "target_dur": 9, "target_i": [145, 159], "target_posit": 167, "target_x": [145, 159], "target_xp": [14, 17], "task": [2, 6, 15, 128, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 158, 159, 160, 165, 166, 167, 175, 177], "tassa": [139, 140, 141], "tau": 135, "taxi": [149, 155, 156, 170, 176], "taxi_col": 154, "taxi_row": 154, "taxi_v3_action_masking_comparison": 173, "td": [175, 178], "td3": 171, "td_error": 178, "teach": [158, 163], "team": [155, 156], "technic": [16, 156], "techniqu": [17, 20, 161, 173], "techreport": [133, 134], "tell": [158, 163, 166, 171, 174], "templat": [3, 165], "tempor": 163, "temporal_differ": [163, 174], "temporarili": [13, 163], "ten": [150, 174], "tendon": [140, 141], "tendon_length": [140, 141], "tendon_veloc": [140, 141], "tensor": [14, 17, 20, 177, 178], "term": [2, 14, 18, 130, 131, 136, 137, 138, 139, 140, 141, 142, 144, 145, 146, 147, 159, 163, 165, 167, 178], "termin": [2, 3, 9, 10, 11, 12, 14, 17, 18, 19, 20, 131, 132, 133, 134, 150, 151, 152, 153, 154, 155, 156, 157, 158, 159, 161, 163, 165, 167, 174, 175, 177, 178], "terminal_observ": 155, "terminal_on_life_loss": 17, "terminaltyp": [3, 156], "terminate_when_unhealthi": [137, 139, 140, 147, 169], "terminationwrapp": 169, "terrain": [127, 148, 169], "terri": 156, "terribli": 155, "test": [9, 17, 127, 148, 155, 156, 158, 161, 165, 169, 177], "test_ag": 163, "tetri": 148, "text": [2, 5, 7, 8, 13, 150, 151, 152, 153, 154, 155, 156, 158], "textencod": 155, "th": [17, 18, 20], "than": [1, 4, 6, 16, 129, 131, 132, 133, 134, 143, 144, 150, 155, 156, 158, 159, 161, 163, 169, 174, 175, 178], "thank": 156, "theden": 155, "thei": [5, 11, 17, 20, 136, 149, 150, 151, 152, 153, 155, 156, 159, 160, 162, 165, 169, 173, 178], "theirfor": 178, "them": [3, 5, 14, 15, 17, 129, 137, 138, 145, 148, 154, 155, 156, 160, 167, 169, 173, 178], "themselv": 148, "theo": 156, "theorem": 148, "theoret": [148, 155, 156, 163], "theori": [135, 142, 155, 158, 175, 178], "therefor": [2, 5, 17, 137, 140, 141, 145, 147, 155, 156, 170, 172, 176], "thesi": [133, 134, 146], "theta": [135, 155], "theta1": 131, "theta2": 131, "theta_dt": 135, "thi": [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 126, 127, 128, 129, 130, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 150, 151, 152, 153, 154, 155, 156, 157, 158, 159, 161, 162, 163, 165, 166, 167, 169, 171, 173, 174, 175, 177, 178], "thigh": [138, 139, 140, 141, 147], "thigh_joint": [139, 147], "thigh_left_joint": 147, "thing": [13, 15, 155, 163, 167], "think": [13, 148, 158], "third": [137, 138, 139, 140, 141, 143, 146, 147, 155, 156, 165], "third_party_environ": 155, "thoma": 175, "thoroughli": 159, "those": [13, 14, 131, 155, 159, 167, 175, 178], "though": [6, 11, 155], "thought": [155, 156, 163], "thousand": [156, 161], "thousandth": 17, "thread": 156, "three": [5, 6, 15, 139, 140, 141, 146, 155, 156, 159, 165], "threshold": [4, 131, 132, 154, 165], "throttl": [129, 159], "through": [2, 3, 4, 5, 10, 11, 12, 14, 17, 18, 20, 140, 141, 148, 155, 156, 157, 158, 159, 162, 163, 166, 173], "throw": [156, 167], "thrower": 155, "thrown": 7, "thruster": 129, "thu": [11, 137, 140, 141, 142, 156, 178], "thytu": 156, "ti": 175, "tick": 165, "tight": 173, "tight_layout": [163, 174, 175, 178], "tile": [128, 153, 175], "tileset": 153, "till": [174, 178], "till2": 156, "tilleri": 153, "tilt": 129, "tim": 175, "time": [1, 2, 5, 6, 9, 10, 14, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 127, 128, 132, 135, 137, 138, 139, 140, 141, 142, 144, 145, 146, 147, 148, 151, 152, 154, 155, 156, 158, 159, 160, 161, 162, 163, 165, 168, 169, 170, 171, 173, 174, 177, 178], "time_limit": [153, 154], "time_queu": [14, 17, 161], "timeawareobserv": [10, 18, 20, 156, 158], "timelaps": 161, "timelimit": [2, 4, 15, 17, 20, 127, 128, 129, 131, 132, 133, 134, 135, 156, 158, 165, 166], "times10": [137, 140, 141], "timestamp": 2, "timestep": [2, 17, 18, 20, 133, 134, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 158, 159, 165, 169, 177, 178], "timgates42": 155, "timschneider42": 156, "tip": [138, 142, 146, 147], "tips_arm": 144, "titl": [9, 133, 134, 156, 161, 173, 174, 175, 177], "tmrl": 148, "to_json": [5, 156], "to_torch": 156, "tobirohr": 156, "toctre": 1, "todorov": [139, 140, 141], "togeth": [5, 12, 136, 160, 175], "toi": [126, 150, 151, 152, 153, 154, 155], "tom": 154, "toml": 165, "ton": 155, "too": [137, 138, 139, 140, 141, 142, 144, 145, 146, 147, 158, 159, 169, 175], "took": 161, "tool": [137, 138, 139, 140, 141, 143, 146, 147, 148, 158, 161], "toolbox": 148, "toolkit": 148, "top": [128, 129, 130, 133, 134, 139, 142, 143, 147, 148, 155, 156, 159, 165, 175, 177], "torch": [2, 14, 17, 20, 156, 177, 178], "torqu": [127, 129, 131, 135, 137, 138, 139, 140, 141, 144, 145, 146, 147], "torso": [137, 138, 139, 140, 141, 147, 169], "toss": 7, "total": [2, 127, 128, 129, 137, 138, 139, 140, 141, 142, 144, 145, 146, 147, 154, 158, 161, 163, 173, 175, 177, 178], "total_episod": 175, "total_num_episod": 177, "total_reward": [158, 163, 173, 175], "total_timestep": 156, "touch": [14, 159, 165], "touretzki": 131, "toward": [146, 155, 163], "tower": 156, "towers2024gymnasium": 156, "towers_gymnasium_2023": 156, "town": 156, "toy_text": [153, 155, 174, 175], "tpu": 162, "tqdm": [163, 174, 175, 178], "trace": [127, 156], "traceback": [13, 17], "track": [9, 14, 17, 20, 128, 132, 137, 138, 139, 140, 146, 147, 148, 156, 163, 173], "trackmania": 148, "trade": [148, 156, 158, 159], "tradeoff": 178, "traffic": 148, "train": [10, 137, 140, 141, 142, 145, 148, 155, 156, 158, 159, 160, 171, 173, 175], "train_q_learn": 173, "training_env": 160, "training_error": [163, 174], "training_error_moving_averag": [163, 174], "training_period": 161, "training_video": 161, "trajectori": [14, 18, 19, 129, 140, 141], "transfer": [14, 17, 148, 162], "transform": [3, 5, 8, 9, 14, 15, 16, 18, 19, 20, 145, 167], "transformact": [14, 16, 20], "transformob": 156, "transformobserv": [14, 18, 20], "transformreward": [14, 19, 20], "transit": [3, 9, 140, 141, 151, 152, 153, 154, 156, 157, 166, 178], "transition_info": 3, "translat": [137, 140, 141, 156, 159, 165], "transport": 148, "transpos": [9, 165], "treasur": 175, "treat": 158, "treatment": 148, "tremend": 155, "trend": 161, "tri": 156, "trial": [158, 163], "trigaten": 155, "trigger": [9, 17, 154, 161], "tristan": 156, "tristandeleu": 155, "trivial": [158, 159, 165], "true": [2, 4, 6, 8, 9, 10, 11, 12, 14, 15, 16, 17, 18, 19, 127, 128, 132, 136, 137, 138, 139, 140, 141, 146, 147, 150, 153, 154, 155, 156, 158, 161, 163, 165, 169, 173, 174, 175, 177, 178], "true_": [16, 18], "trunc": [14, 18], "truncat": [2, 4, 9, 10, 11, 12, 14, 17, 18, 19, 20, 128, 131, 132, 133, 134, 153, 154, 155, 156, 157, 158, 159, 161, 163, 165, 167, 169, 173, 174, 175, 177, 178], "trunk": 169, "try": [141, 148, 155, 156, 158, 159, 163, 174], "tuckerbmorgan": 155, "tune": [148, 177], "tupl": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 20, 137, 139, 140, 147, 150, 155, 156, 158, 159, 160, 163, 165, 174, 177, 178], "turbotimon": 156, "turbul": [129, 155], "turbulence_pow": [129, 178], "turn": [9, 11, 17, 128, 129, 142, 148, 155, 156], "tutori": [2, 15, 156, 159, 160, 161, 163, 164, 165, 166, 167, 168, 169, 172, 173, 174, 175, 176, 177, 178], "tutorials_jupyt": 170, "tutorials_python": 170, "tweak": [136, 146], "two": [2, 5, 6, 7, 9, 10, 17, 18, 20, 127, 129, 131, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 145, 146, 147, 148, 150, 155, 156, 159, 161, 162, 165, 174, 178], "txt": [1, 155], "type": [2, 4, 5, 6, 7, 10, 14, 16, 17, 18, 20, 128, 132, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 155, 156, 159, 160, 165, 167, 175, 177], "typeerror": 156, "typic": [2, 9, 154, 159, 161, 169, 173], "typo": [155, 156], "u": [5, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 155, 156, 159, 163, 165, 167, 174, 177], "uav": 148, "uint8": [18, 128], "un": 132, "unattach": [144, 145], "unbound": [7, 18], "uncertain": 148, "uncertainti": 148, "unclear": [156, 159], "uncom": 169, "uncommon": 156, "undefin": 2, "under": [2, 156, 174, 177], "underli": [2, 15, 17, 131, 156, 158], "underneath": [15, 132, 158], "underpow": 130, "underscor": [155, 160], "understand": [2, 8, 10, 144, 156, 159, 160], "undocu": 156, "uneven": 127, "unexpect": [11, 129, 155], "unflatten": [5, 8, 156], "unhealthi": [137, 139, 140, 142, 143, 147], "unicod": 9, "uniform": [5, 7, 8, 133, 134, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 175], "uniformli": [7, 131, 132, 154, 165], "uniniti": 159, "unintend": 156, "union": [6, 7, 19, 156], "uniqu": [6, 10, 126, 130, 136, 142, 155, 160], "unit": [5, 14, 18, 20, 129, 131, 133, 134, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148], "uniti": 148, "unitless": [142, 145], "unitre": 169, "unitree_go1": 169, "univers": [133, 134, 175], "unknown": [2, 9, 10, 148, 158], "unless": [7, 15, 150, 151, 152, 153, 154, 155, 165], "unlik": [6, 163, 177], "unmaintain": 156, "unmasked_mean_curv": 173, "unmasked_mean_reward": 173, "unmasked_overall_mean": 173, "unmasked_overall_std": 173, "unmasked_result": 173, "unmasked_results_list": 173, "unnecessari": [155, 156], "unnecessarili": 160, "unnescesari": 155, "unord": 5, "unpack": 160, "unpickl": [9, 13, 155, 156], "unplay": 9, "unreli": 160, "unsupport": 7, "untermin": 132, "until": [17, 144, 150, 151, 152, 153, 155, 156, 158, 163, 165, 175, 177, 178], "unus": [155, 159], "unusu": 161, "unwrap": [2, 10, 15, 131, 156, 158, 159], "up": [2, 6, 7, 10, 127, 129, 136, 137, 139, 140, 141, 147, 150, 151, 152, 153, 154, 156, 158, 159, 161, 163, 165, 169, 170, 173, 174, 175, 176], "updat": [1, 2, 3, 9, 14, 16, 17, 18, 19, 137, 139, 140, 147, 154, 155, 156, 158, 159, 160, 165, 166, 167, 173, 174, 175, 177, 178], "update_paramet": 178, "update_running_mean": [18, 19], "upfront": 160, "upgrad": [155, 156], "uph": 141, "uph_cost": 141, "uph_cost_weight": 141, "upload": 161, "upon": [133, 134, 160], "upper": [7, 14, 19, 20, 140, 141, 155, 158], "upright": [132, 135, 142, 143, 158], "upsid": 156, "upstream": 156, "urandom": 2, "urban": 148, "urdf": 169, "url": [155, 156, 178], "urldat": 156, "us": [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 17, 18, 19, 20, 126, 127, 129, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 153, 154, 155, 156, 158, 160, 161, 162, 163, 166, 167, 169, 170, 173, 174, 176], "usabl": [150, 155, 163, 174], "usable_ac": [163, 174], "usag": [9, 156, 159, 160, 161, 163, 167], "use_action_mask": 173, "use_contact_forc": [137, 156], "use_cuda": 178, "useless": 169, "user": [2, 3, 4, 5, 9, 10, 12, 14, 18, 20, 131, 132, 133, 134, 135, 155, 156, 158, 160, 164, 165, 168, 170, 177], "usual": [2, 6, 7, 17, 139, 158, 163, 165, 167, 169, 174, 178], "util": [18, 148, 155, 156, 158, 159, 165, 178], "utilis": [10, 155], "utli": 156, "v": [4, 133, 134, 160, 173, 178], "v0": [2, 4, 9, 10, 14, 16, 17, 18, 19, 127, 128, 129, 131, 132, 133, 134, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 150, 151, 152, 153, 154, 159, 165, 166, 171, 177], "v1": [2, 4, 9, 10, 11, 12, 14, 16, 17, 18, 19, 127, 128, 129, 131, 132, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 150, 151, 152, 153, 154, 155, 158, 161, 163, 171, 174, 175], "v2": [127, 128, 129, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 154, 155, 156], "v21": [155, 156, 160], "v24": 155, "v25": 155, "v26": [2, 156, 160, 177], "v28": 156, "v2g": 148, "v3": [9, 14, 17, 18, 127, 128, 129, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 154, 155, 156, 157, 158, 160, 167, 173, 178], "v4": [14, 15, 16, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 155, 156, 171, 177], "v5": [17, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 156, 160, 169], "vairodp": 156, "val": 175, "valentin": 156, "valid": [2, 4, 5, 7, 10, 13, 14, 158, 163, 173, 174, 178], "valid_act": 173, "valid_next_act": 173, "vallei": [133, 134], "valu": [2, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 20, 127, 129, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 150, 151, 152, 153, 154, 155, 156, 158, 160, 163, 165, 166, 169, 173, 174, 175, 177, 178], "value_funct": 160, "value_grid": 174, "value_pr": 178, "valueerror": [7, 8, 11, 12, 13, 17], "vampir": 148, "var": 19, "vari": [132, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 177], "variabl": [2, 5, 7, 11, 13, 14, 15, 17, 136, 137, 139, 146, 147, 148, 155, 156, 158, 165, 166, 174, 177], "varianc": [14, 18, 19, 20, 173, 178], "variant": [128, 165], "variat": 136, "varieti": [9, 148], "variou": [5, 141, 148, 155, 177], "ve": [155, 156, 159, 163], "vec_env": [9, 159], "vecenvwrapp": 155, "vector": [2, 4, 7, 9, 11, 12, 16, 17, 18, 19, 127, 129, 142, 143, 145, 148, 155, 156, 158, 159, 161, 170, 176, 177], "vector_a2c": 178, "vector_entry_point": [4, 132, 156], "vector_env": 14, "vector_kwarg": 4, "vector_list_info": 155, "vectoractionwrapp": [14, 156], "vectorenv": [4, 5, 14, 155, 156], "vectorenvcr": 4, "vectorenvwrapp": 156, "vectoris": [5, 148], "vectorization_mod": [4, 9, 10, 11, 12, 14, 132, 156], "vectorizemod": 4, "vectorizetransformact": [14, 20], "vectorizetransformobserv": [14, 20], "vectorizetransformreward": [14, 20], "vectorizor": [4, 132], "vectorlistinfo": [14, 155, 156], "vectorobservationwrapp": [14, 156], "vectorrewardwrapp": [14, 156], "vectorwrapp": [14, 156], "vehicl": 148, "veloc": [2, 8, 13, 127, 129, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 158, 159], "velocity_penalti": 142, "veri": [6, 129, 144, 155, 156, 158, 159, 162, 163, 165, 178], "verifi": [9, 159, 160, 163], "vermouth1992": [155, 156], "versa": [13, 17, 18, 160], "version": [1, 2, 4, 5, 14, 16, 17, 18, 19, 148, 155, 156, 159, 160, 163, 165, 166, 167, 169, 173, 174, 175, 177, 178], "vertic": [127, 139, 141, 142, 143, 147, 159, 165], "vf_next_stat": 166, "vf_target": 166, "via": [5, 9, 14, 15, 17, 126, 130, 136, 148, 149, 158, 165, 177], "viabl": 174, "vicbentu": 156, "vice": [13, 17, 18, 160], "vicent": 156, "video": [1, 17, 20, 127, 155, 156, 158, 159, 161, 163, 169, 171, 175], "video0": 169, "video_fold": [9, 17, 161], "video_length": [9, 17], "video_path": 161, "videorecord": [17, 155, 156], "view": [2, 156, 159, 169], "view_init": 174, "viewer": [10, 11, 12, 156], "viewport": 129, "viewport_h": 129, "viewport_w": 129, "virgilt": 155, "viridi": 174, "viscou": 146, "visibl": 165, "visit": [128, 175], "visual": [148, 158, 159, 160, 161, 163, 169], "visual_env": 160, "visual_opt": [136, 156], "visualis": 2, "vizdoom": 148, "vmoen": [155, 156], "voidflight": 156, "vol": [131, 154], "volleybal": 148, "volunt": 156, "vscode": [156, 171], "vwxyzjn": 155, "vx": [14, 17, 129], "vy": 129, "w": [9, 137, 140, 141, 178], "w_": [137, 138, 139, 140, 141, 144, 145, 146, 147], "wa": [2, 4, 6, 9, 10, 14, 17, 18, 19, 132, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 155, 156, 159, 160, 163, 166, 167, 177, 178], "wai": [2, 13, 15, 17, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 155, 156, 158, 163, 166, 167, 174, 175, 178], "wait": [9, 10, 11, 155, 166], "wait_on_play": 9, "wake": 129, "walk": [136, 140, 147, 149, 153, 156, 159, 165, 169], "walker": [126, 145, 147, 155], "walker2d": [136, 156], "walker2d_v5": 147, "wall": [133, 134, 154, 159, 161, 173], "wandb": 161, "want": [1, 2, 4, 6, 11, 15, 17, 137, 140, 141, 155, 156, 158, 159, 160, 161, 165, 167, 169, 174, 175, 178], "ward": 177, "warehous": 148, "warn": [6, 9, 10, 11, 17, 144, 155, 156], "wasn": 17, "wast": 173, "watch": [1, 161, 163, 171], "water": 148, "wawrzy\u0144ski": 138, "we": [1, 2, 3, 4, 5, 7, 9, 13, 18, 148, 155, 156, 157, 158, 159, 160, 161, 162, 163, 165, 166, 167, 169, 173, 174, 177, 178], "web": 148, "websit": [21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 136, 155, 156], "weigh": 137, "weight": [137, 138, 139, 140, 141, 144, 145, 146, 147, 148, 155, 161, 166, 167, 177], "well": [2, 5, 14, 131, 148, 155, 159, 163, 165, 175, 178], "were": [126, 131, 136, 154, 155, 156, 160, 163, 165, 169, 178], "weren": 160, "west": [154, 173], "what": [2, 5, 6, 148, 151, 152, 156, 159, 161, 162], "wheel": [126, 128, 155], "when": [2, 4, 5, 8, 9, 10, 11, 12, 13, 14, 17, 18, 20, 128, 129, 137, 139, 140, 141, 142, 143, 144, 147, 151, 152, 153, 154, 155, 156, 158, 159, 160, 163, 165, 166, 167, 169, 173, 175, 177, 178], "whenev": [17, 129, 165], "where": [1, 4, 6, 7, 8, 9, 14, 17, 128, 129, 131, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 150, 151, 152, 153, 154, 155, 156, 157, 158, 159, 160, 161, 162, 163, 165, 166, 167, 169, 173, 174, 175, 177, 178], "wherea": 175, "whether": [2, 3, 4, 5, 7, 9, 15, 17, 129, 137, 138, 139, 140, 141, 146, 147, 148, 150, 158, 159, 163, 165, 166, 174, 177], "which": [1, 2, 4, 5, 8, 9, 10, 14, 17, 18, 127, 128, 129, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 150, 151, 152, 153, 154, 155, 156, 158, 159, 160, 162, 165, 166, 167, 169, 171, 173, 175, 177, 178], "while": [4, 8, 9, 11, 14, 17, 18, 19, 129, 131, 132, 135, 137, 140, 141, 146, 150, 151, 152, 155, 158, 159, 160, 161, 163, 165, 166, 173, 174, 175, 177, 178], "white": 155, "who": 156, "whole": [4, 155, 156, 169], "whose": [137, 150], "why": [129, 163], "wide": [148, 158], "width": [136, 156, 165], "wikipedia": 175, "wildli": 163, "willdudlei": 156, "william": [133, 134, 177], "win": [150, 163, 174], "win_rat": 163, "wind": [129, 155, 156], "wind_pow": [129, 155, 178], "window": [2, 9, 128, 136, 155, 156, 158, 160, 161, 163, 165], "window_s": 165, "wing": 148, "wire": 148, "wireless": 148, "wise": 177, "wish": [9, 155, 156], "within": [2, 5, 7, 9, 13, 14, 16, 17, 18, 20, 129, 130, 143, 155, 156, 158, 159], "without": [14, 15, 17, 19, 140, 148, 150, 153, 155, 156, 158, 159, 163, 165, 169, 173, 174], "won": [2, 163, 174], "word": [144, 177], "work": [5, 9, 128, 129, 131, 138, 139, 142, 143, 148, 155, 156, 158, 159, 160, 163], "worker": 11, "workflow": 156, "workshop": 148, "world": [129, 148, 151, 152, 153, 154, 156, 173, 175], "worldbodi": [137, 140, 141], "worri": 165, "wors": [155, 163], "would": [6, 8, 16, 18, 19, 137, 138, 139, 140, 146, 147, 155, 156, 157, 165, 167, 169, 178], "wouldn": 156, "wrap": [2, 4, 9, 11, 12, 14, 15, 16, 17, 18, 19, 20, 148, 158, 159, 165, 167, 177, 178], "wrapped_env": [14, 15, 16, 17, 18, 158, 159, 165, 167, 177], "wrapped_env_ob": 16, "wrapped_obs0": 18, "wrapped_obs1": 18, "wrappedenvacttyp": 156, "wrappedenvobstyp": 156, "wrapper": [2, 4, 6, 7, 9, 10, 13, 137, 138, 139, 140, 141, 143, 146, 147, 148, 153, 154, 155, 156, 158, 161, 163, 168, 170, 174, 177, 178], "wrapper_spec": 15, "wrapperacttyp": [15, 16], "wrapperobstyp": [15, 18], "wrapperspec": [4, 15], "wrist": 144, "write": [5, 11, 13, 156, 159, 165, 169], "write_to_shared_memori": [5, 13], "written": [9, 156, 162], "wrong": [155, 156, 158, 159, 160, 163], "www": [128, 150, 151, 152, 153, 155], "x": [2, 5, 8, 14, 129, 132, 133, 134, 135, 137, 138, 139, 140, 141, 142, 144, 145, 146, 147, 148, 151, 152, 156, 159, 161, 165, 175, 177, 178], "x_": [137, 138, 139, 140, 142, 146, 147], "x_init": 133, "x_posit": [14, 137, 138, 139, 140, 141, 146, 147], "x_veloc": 14, "xlabel": [161, 173], "xml": [137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 155, 156, 169], "xml_file": [136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 156, 169], "xp": 14, "xpo": [137, 140, 144, 145], "xtick": 174, "xticklabel": 175, "xuanhien070594": 156, "xuehaipan": [155, 156], "xx": 175, "xy": 142, "y": [2, 129, 135, 137, 138, 139, 140, 141, 142, 144, 145, 146, 154, 159, 175, 177], "y_": 142, "y_coordin": 142, "y_init": 133, "y_posit": [137, 138, 139, 140, 141, 146, 147], "yaniv": 156, "year": [133, 134, 155, 156], "yellow": 154, "yet": [148, 156], "yield": 13, "ylabel": [161, 173, 175], "you": [1, 2, 5, 6, 7, 8, 9, 11, 14, 15, 16, 17, 18, 19, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 127, 128, 137, 140, 141, 148, 155, 156, 157, 158, 160, 161, 163, 165, 166, 167, 169, 171, 173, 175, 178], "youjiacheng": 155, "youni": [155, 156], "younik": [155, 156], "your": [1, 2, 5, 9, 11, 14, 15, 16, 17, 18, 128, 137, 140, 141, 148, 155, 156, 157, 162, 167, 168, 170, 174, 178], "your_env": 9, "yourself": [11, 128, 159, 165, 174], "ytick": 174, "yticklabel": 175, "z": [137, 138, 139, 140, 141, 142, 144, 145, 147], "z_": 141, "z_distance_from_origin": [139, 141, 147], "zaxi": 174, "zemann": [174, 178], "zenodo": 156, "zero": [7, 13, 18, 135, 137, 139, 140, 141, 147, 156, 163, 165, 166, 173, 174, 175, 177, 178], "zero_grad": [177, 178], "zhiqingxiao": 155, "zip": [170, 173], "zlig": 155, "zoom": 9, "zuoxingdong": 155, "zzyunzhi": 155, "\u03b1": 173, "\u03b3": 173, "\u03b5": 173}, "titles": ["404 - Page Not Found", "Gymnasium-docs", "Env", "Functional Env", "Make and register", "Spaces", "Composite Spaces", "Fundamental Spaces", "Spaces Utils", "Utility functions", "Vectorize", "AsyncVectorEnv", "SyncVectorEnv", "Utility functions", "Wrappers", "Wrappers", "Action Wrappers", "Misc Wrappers", "Observation Wrappers", "Reward Wrappers", "List of Wrappers", "Atari", "Adventure", "Air Raid", "Alien", "Amidar", "Assault", "Asterix", "Asteroids", "Atlantis", "Atlantis2", "Backgammon", "Bank Heist", "Basic Math", "Battle Zone", "Beam Rider", "Berzerk", "Blackjack", "Bowling", "Boxing", "Breakout", "Carnival", "Casino", "Centipede", "Chopper Command", "Crazy Climber", "Crossbow", "Darkchambers", "Defender", "Demon Attack", "Donkey Kong", "Double Dunk", "Earthworld", "Elevator Action", "Enduro", "Entombed", "Et", "Fishing Derby", "Flag Capture", "Freeway", "Frogger", "Frostbite", "Galaxian", "Gopher", "Gravitar", "Hangman", "Haunted House", "Hero", "Human Cannonball", "Ice Hockey", "Jamesbond", "Journey Escape", "Kaboom", "Kangaroo", "Keystone Kapers", "King Kong", "Klax", "Koolaid", "Krull", "Kung Fu Master", "Laser Gates", "Lost Luggage", "Mario Bros", "Miniature Golf", "Montezuma Revenge", "Mr Do", "Ms Pacman", "Name This Game", "Othello", "Pacman", "Phoenix", "Pitfall", "Pitfall2", "Pong", "Pooyan", "Private Eye", "Qbert", "Riverraid", "Road Runner", "Robotank", "Seaquest", "Sir Lancelot", "Skiing", "Solaris", "Space Invaders", "Space War", "Star Gunner", "Superman", "Surround", "Tennis", "Tetris", "Tic Tac Toe 3D", "Time Pilot", "Trondead", "Turmoil", "Tutankham", "Up N Down", "Venture", "Video Checkers", "Video Chess", "Video Cube", "Video Pinball", "Wizard Of Wor", "Word Zapper", "Yars Revenge", "Zaxxon", "Box2D", "Bipedal Walker", "Car Racing", "Lunar Lander", "Classic Control", "Acrobot", "Cart Pole", "Mountain Car", "Mountain Car Continuous", "Pendulum", "MuJoCo", "Ant", "Half Cheetah", "Hopper", "Humanoid", "Humanoid Standup", "Inverted Double Pendulum", "Inverted Pendulum", "Pusher", "Reacher", "Swimmer", "Walker2D", "External Environments", "Toy Text", "Blackjack", "Cliff Walking", "Cliff Walking Slippery", "Frozen Lake", "Taxi", "Gym Release Notes", "Gymnasium Release Notes", "<no title>", "Basic Usage", "Create a Custom Environment", "Gym Migration Guide", "Recording Agents", "Speeding Up Training", "Training an Agent", "Gymnasium Basics", "Make your own custom environment", "Handling Time Limits", "Implementing Custom Wrappers", "Gymnasium Basics", "Load custom quadruped robot environments", "Tutorials", "Third-Party Tutorials", "Training Agents", "Action Masking in the Taxi Environment", "Solving Blackjack with Tabular Q-Learning", "Solving Frozenlake with Tabular Q-Learning", "Training Agents", "Training using REINFORCE for Mujoco", "Speeding up A2C Training with Vector Envs"], "titleterms": {"0": [155, 156, 160, 169], "0a1": 156, "0a2": 156, "1": [155, 156, 160, 169], "11": 175, "12": 155, "19": 155, "2": [155, 156, 160, 169], "20": 155, "21": [155, 160], "22": 155, "23": 155, "24": 155, "25": 155, "26": [155, 156, 160], "27": 156, "28": 156, "29": 156, "3": [155, 156, 160, 169], "3d": 111, "4": [155, 160, 169, 175], "404": 0, "5": [155, 160], "6": 155, "7": [155, 175], "9": [155, 175], "Not": 0, "Of": 122, "The": [0, 160, 163, 175], "__init__": 159, "a2c": 178, "about": [159, 163, 171], "acrobot": 131, "across": 136, "action": [14, 16, 53, 127, 128, 129, 131, 132, 133, 134, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 150, 151, 152, 153, 154, 158, 159, 163, 173, 174], "actionwrapp": 167, "actor": 178, "ad": [1, 159], "add": 159, "addit": [4, 10, 11, 12], "advanc": 159, "advantag": 178, "adventur": 22, "agent": [158, 161, 163, 169, 170, 172, 174, 176, 177, 178], "agilerl": 171, "air": 23, "algorithm": 162, "alien": 24, "alpha": 156, "alpha1": 156, "altern": 165, "amidar": 25, "an": [1, 163, 174, 177], "analysi": [173, 178], "analyz": 163, "ant": 137, "api": [9, 160], "argument": [127, 128, 129, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 150, 151, 152, 153, 154], "assault": 26, "asterix": 27, "asteroid": 28, "asynchron": 178, "asyncvectorenv": 11, "atari": 21, "atlanti": 29, "atlantis2": 30, "attack": 49, "attribut": [2, 5, 10, 15], "autonom": 148, "avail": 16, "backend": 136, "backgammon": 31, "bank": 32, "base": [3, 16], "basic": [33, 158, 164, 168, 170], "battl": 34, "beam": 35, "befor": 159, "beginn": 158, "benchmark": 9, "benefit": 161, "berzerk": 36, "best": 161, "better": 174, "biolog": 148, "biped": 127, "blackjack": [37, 150, 163, 174], "boundari": 159, "bowl": 38, "box": 39, "box2d": 126, "breakdown": 160, "breakout": 40, "bro": 82, "build": [1, 163, 174, 177], "can": 174, "cannonbal": 68, "captur": 58, "car": [128, 133, 134], "carniv": 41, "cart": 132, "casino": 42, "centiped": 43, "chang": 160, "check": [9, 159], "checker": 118, "cheetah": 138, "chess": 119, "chopper": 44, "class": 16, "classic": 130, "cliff": [151, 152], "climber": 45, "close": 165, "code": [158, 159, 160, 166, 171], "command": 44, "common": [14, 17, 158, 159, 163], "compar": 136, "comparison": 160, "compat": [9, 160], "complet": 160, "complex": 159, "composit": [5, 6], "comput": 148, "construct": [159, 165], "continu": 134, "control": 130, "convers": [14, 17], "convert": 3, "core": 4, "could": 0, "crazi": 45, "creat": [2, 159, 165, 175], "credit": [127, 128, 129], "critic": 178, "crossbow": 46, "cube": 120, "curv": 177, "custom": [159, 165, 167, 169], "darkchamb": 47, "data": [14, 17], "debug": 159, "declar": 165, "defend": 48, "demon": 49, "derbi": 57, "descript": [127, 128, 129, 131, 132, 133, 134, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 150, 151, 152, 153, 154], "design": 159, "did": 160, "do": [85, 174], "doc": 1, "document": 1, "domain": 178, "done": 160, "donkei": 50, "doubl": [51, 142], "down": 116, "download": 169, "drive": 148, "dunk": 51, "dure": [161, 163], "dynam": [133, 134], "earthworld": 52, "econom": 148, "edit": 1, "electr": 148, "elev": 53, "end": [131, 132, 133, 134, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 150, 151, 152, 153, 154], "enduro": 54, "energi": 148, "entomb": 55, "env": [2, 3, 165, 178], "environ": [1, 2, 3, 9, 10, 132, 148, 158, 159, 160, 162, 163, 165, 169, 173, 174, 175, 178], "epilogu": 169, "episod": [127, 128, 129, 131, 132, 133, 134, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 150, 151, 152, 153, 154, 161], "error": 159, "escap": 71, "et": 56, "evalu": 161, "everi": 161, "exact": 136, "exampl": 159, "execut": [163, 174], "expect": 163, "experi": [161, 173], "explain": 158, "exploit": 163, "explor": 163, "extern": 148, "ey": 95, "featur": 159, "financi": 148, "first": [148, 158], "fish": 57, "flag": 58, "found": 0, "freecodecamp": 171, "freewai": 59, "frogger": 60, "from": [165, 167, 171], "frostbit": 61, "frozen": 153, "frozenlak": 175, "fu": 79, "function": [3, 4, 5, 9, 13, 159, 160], "fundament": [5, 7], "galaxian": 62, "game": [87, 148], "gate": 80, "gener": [160, 165], "get": [160, 163], "golf": 83, "gopher": 63, "gradual": 159, "gravitar": 64, "gridworld": 159, "guid": 160, "gunner": 106, "gym": [148, 155, 160], "gymnasium": [1, 10, 148, 156, 158, 164, 165, 167, 168, 170, 171], "half": 138, "handl": [159, 166], "hangman": 65, "haunt": 66, "heist": 32, "help": 160, "helper": 160, "hero": 67, "heurist": 162, "histori": [127, 128, 129, 131, 132, 133, 134, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 150, 151, 152, 153, 154], "hockei": 69, "hopper": 139, "hous": 66, "how": 173, "human": 68, "humanoid": [140, 141], "i": 158, "ic": 69, "implement": [2, 14, 18, 19, 167], "import": [166, 174], "improv": 163, "includ": 160, "inform": [150, 151, 152, 153, 154, 161], "inherit": 167, "initi": [156, 158, 165], "instanc": 165, "instruct": 1, "integr": 161, "interpret": 163, "introduct": 178, "intuit": 163, "invad": 104, "invert": [142, 143], "issu": [158, 159, 163], "jamesbond": 70, "jax": 3, "johnni": 171, "journei": 71, "kaboom": 72, "kangaroo": 73, "kaper": 74, "kei": [159, 160], "keyston": 74, "king": 75, "klax": 76, "known": 159, "kong": [50, 75], "koolaid": 77, "krull": 78, "kung": 79, "lake": 153, "lancelot": 101, "lander": 129, "laser": 80, "learn": [158, 159, 163, 166, 174, 175, 177], "librari": 171, "limit": 166, "list": 20, "ll": 175, "load": [160, 169, 178], "loop": [158, 163], "lost": 81, "luggag": 81, "lunar": 129, "m": 86, "make": [4, 10, 159, 165], "manual": 159, "map": 175, "mario": 82, "mask": 173, "master": 79, "math": 33, "mathemat": 148, "medic": 148, "memori": 13, "method": [2, 5, 10, 11, 12, 15], "migrat": 160, "miniatur": 83, "misc": 17, "miscellan": 13, "mode": 160, "model": 169, "modifi": [1, 158], "montezuma": 84, "more": 161, "mountain": [133, 134], "mr": 85, "mujoco": [136, 177], "n": 116, "name": [87, 160], "network": 177, "never": 163, "new": [1, 9, 160], "next": [158, 159, 163], "note": [129, 146, 155, 156], "notic": 178, "number": 160, "observ": [14, 18, 127, 128, 129, 131, 132, 133, 134, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 150, 151, 152, 153, 154, 158, 159, 165, 169, 174], "observationwrapp": 167, "old": [9, 160], "onli": [14, 20], "openai": 160, "optim": 162, "othello": 88, "other": [1, 148], "output": 161, "own": 165, "packag": [160, 165], "pacman": [86, 89], "page": [0, 1], "paramet": [169, 175], "parameter": 159, "parti": [148, 171], "pendulum": [135, 142, 143], "perform": [9, 136, 178], "period": 161, "phoenix": 90, "pickl": 9, "pilot": 112, "pinbal": 121, "pitfal": [91, 159], "pitfall2": 92, "plai": 178, "plot": [177, 178], "pole": 132, "polici": [174, 177], "pong": 93, "poor": 163, "pooyan": 94, "practic": 161, "privat": 95, "problem": 159, "process": 163, "program": 158, "pusher": 144, "q": [163, 174, 175], "qbert": 96, "quadrup": 169, "question": 159, "quick": 160, "race": 128, "raid": 23, "random": [160, 178], "reacher": 145, "read": 160, "real": 159, "recommend": 165, "record": 161, "refer": [128, 131, 150, 151, 152, 154, 160, 175, 177, 178], "regist": [4, 159, 165], "reinforc": [158, 177], "releas": [155, 156], "remov": 160, "render": [9, 136, 159, 160, 165], "represent": 159, "reproduc": 136, "request": 0, "research": 159, "reset": [128, 159, 160, 165], "result": [163, 173], "reveng": [84, 124], "reward": [14, 19, 127, 128, 129, 131, 132, 133, 134, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 150, 151, 152, 153, 154, 159, 169], "rewardwrapp": 167, "rider": 35, "riverraid": 97, "rl": 158, "road": 98, "robot": [148, 169], "robotank": 99, "run": [173, 175], "runner": 98, "runtim": 9, "save": [9, 178], "seaquest": 100, "seed": [9, 160], "setup": [165, 169, 174, 178], "share": 13, "should": 160, "showcas": 178, "side": 160, "simpl": 159, "simul": 169, "sir": 101, "size": 175, "ski": 102, "slipperi": 152, "slow": 163, "solari": 103, "solut": [163, 165, 166], "solv": [174, 175], "space": [5, 6, 7, 8, 13, 104, 105, 127, 128, 129, 131, 132, 133, 134, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 150, 151, 152, 153, 154, 158, 159], "specif": 160, "speed": [162, 178], "split": 160, "standard": 3, "standup": 141, "star": 106, "start": [127, 128, 129, 131, 132, 133, 134, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 150, 151, 152, 153, 154, 159], "state": [127, 128, 129, 131, 132, 133, 134, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 150, 151, 152, 153, 154, 159, 165], "step": [1, 9, 158, 159, 160, 163, 165, 169], "strategi": 163, "stuck": 163, "subclass": 165, "summari": 161, "superman": 107, "surround": 108, "swimmer": 146, "synchron": 178, "syncvectorenv": 12, "system": 148, "tabl": [160, 175], "tabular": [174, 175], "tac": 111, "taxi": [154, 173], "telecommun": 148, "tenni": 109, "termin": [127, 128, 129, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 160, 166, 169], "test": [159, 160, 163], "tetri": 110, "text": 149, "thi": [87, 160], "think": [159, 174], "third": [148, 171], "tic": 111, "time": [112, 166, 175], "timelimit": 160, "tip": 159, "toe": 111, "toi": 149, "too": 163, "track": 161, "train": [136, 161, 162, 163, 169, 170, 172, 174, 176, 177, 178], "transit": [133, 134], "trondead": 113, "truncat": [135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 160, 166], "try": 178, "turmoil": 114, "tutankham": 115, "tutori": [1, 170, 171], "tweak": 169, "uncommon": 17, "understand": [158, 161, 163, 173], "unstabl": 163, "up": [116, 162, 178], "updat": 163, "us": [148, 159, 165, 171, 175, 177, 178], "usag": 158, "util": [5, 8, 9, 13], "v": 163, "v0": [155, 156, 160], "v1": [156, 160], "valid": 159, "variabl": 4, "vector": [5, 10, 13, 14, 20, 132, 162, 178], "vectorenv": 10, "ventur": 117, "version": [127, 128, 129, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 150, 151, 152, 153, 154], "video": [9, 118, 119, 120, 121, 148], "visual": [9, 173, 174, 175], "visualis": 174, "walk": [151, 152], "walker": 127, "walker2d": 147, "war": 105, "we": 175, "weight": 178, "what": [158, 163], "when": 161, "who": 160, "why": [158, 160, 161], "wizard": 122, "wor": 122, "word": 123, "work": 173, "world": 159, "wrapper": [14, 15, 16, 17, 18, 19, 20, 159, 160, 165, 167], "write": 1, "yar": 124, "you": [159, 174], "your": [158, 159, 160, 161, 163, 165, 169], "yourself": 178, "youtub": 171, "zapper": 123, "zaxxon": 125, "zone": 34}}) \ No newline at end of file diff --git a/tutorials/gymnasium_basics/README/index.html b/tutorials/gymnasium_basics/README/index.html index 8e8593e47..33004e68c 100644 --- a/tutorials/gymnasium_basics/README/index.html +++ b/tutorials/gymnasium_basics/README/index.html @@ -221,8 +221,7 @@
      • Create a Custom Environment
      • Recording Agents
      • Speeding Up Training
      • -
      • Compatibility with Gym
      • -
      • Migration Guide - v0.21 to v1.0.0
      • +
      • Gym Migration Guide

      API

        @@ -302,6 +301,10 @@
    • Training Agents

      API

        @@ -302,6 +301,10 @@
    • Training Agents

      API

        @@ -302,6 +301,10 @@
    • Training Agents

      API

        @@ -302,6 +301,10 @@
    • Training Agents

      API

        @@ -302,6 +301,10 @@
    • Training Agents

      API

        @@ -302,6 +301,10 @@
    • Training Agents

      API

        @@ -302,6 +301,10 @@
    • Training Agents

      API

        @@ -302,6 +301,10 @@
    • Training Agents

      API

        @@ -302,6 +301,10 @@
    • Training Agents
        +
      • Action Masking in the Taxi Environment
      • +
      • Running the Experiment
      • +
      • Visualizing Results
      • +
      • Results Analysis
      • Solving Blackjack with Tabular Q-Learning
      • Solving Frozenlake with Tabular Q-Learning
      • Training using REINFORCE for Mujoco
      • diff --git a/tutorials/training_agents/action_masking_taxi/index.html b/tutorials/training_agents/action_masking_taxi/index.html new file mode 100644 index 000000000..ddaf00b70 --- /dev/null +++ b/tutorials/training_agents/action_masking_taxi/index.html @@ -0,0 +1,1025 @@ + + + + + + + + + + + + + + + Action Masking in the Taxi Environment - Gymnasium Documentation + + + + + + + + + + + + + +
        +
        +
        + +
        + +
        +
        + + +
        +
        +
        +
        + + + + + + + + Contents + + + + + + Menu + + + + + + + + Expand + + + + + + Light mode + + + + + + + + + + + + + + Dark mode + + + + + + + Auto light/dark mode + + + + + + + + + + + + + + + + + +
        + + +
        + + + + + +
        +
        +
        + + + + + Back to top + +
        +
        + +
        + +
        +
        + +
        +

        Note

        +

        This tutorial is compatible with Gymnasium version 1.2.0.

        +
        +
        +

        Action Masking in the Taxi Environment

        +

        This tutorial demonstrates how to use action masking in the Taxi environment to improve reinforcement learning performance by preventing invalid actions.

        +

        The Taxi environment is a classic grid world problem where a taxi needs to pick up a passenger and drop them off at their destination. In this environment, not all actions are valid at every state - for example, you can’t drive through walls or pick up a passenger when you’re not at their location.

        +

        Action masking is a technique that helps reinforcement learning agents avoid selecting invalid actions by providing a binary mask that indicates which actions are valid in the current state. This can significantly improve learning efficiency and performance.

        +
        +

        Understanding the Taxi Environment

        +

        The Taxi environment has 6 possible actions:

        +
          +
        • 0: Move south (down)

        • +
        • 1: Move north (up)

        • +
        • 2: Move east (right)

        • +
        • 3: Move west (left)

        • +
        • 4: Pickup passenger

        • +
        • 5: Drop off passenger

        • +
        +

        The environment provides an action_mask in the info dictionary returned by reset() and step(). +This mask is a binary array where 1 indicates a valid action and 0 indicates an invalid action.

        +
        +
        +

        How Action Masking Works

        +

        Action masking works by constraining the agent’s action selection to only valid actions:

        +
          +
        1. During exploration: When selecting random actions, we only choose from the set of valid actions

        2. +
        3. During exploitation: When selecting the best action based on Q-values, we only consider Q-values for valid actions

        4. +
        5. During Q-learning updates: We compute the maximum future Q-value only over valid actions in the next state

        6. +
        +

        Let’s implement this step by step:

        +
        import random
        +from pathlib import Path
        +
        +import matplotlib.pyplot as plt
        +import numpy as np
        +
        +import gymnasium as gym
        +
        +
        +# Base random seed for reproducibility
        +BASE_RANDOM_SEED = 58922320
        +
        +
        +def train_q_learning(
        +    env,
        +    use_action_mask: bool = True,
        +    episodes: int = 5000,
        +    seed: int = BASE_RANDOM_SEED,
        +    learning_rate: float = 0.1,
        +    discount_factor: float = 0.95,
        +    epsilon: float = 0.1,
        +) -> dict:
        +    """Train a Q-learning agent with or without action masking."""
        +    # Set random seeds for reproducibility
        +    np.random.seed(seed)
        +    random.seed(seed)
        +
        +    # Initialize Q-table
        +    n_states = env.observation_space.n
        +    n_actions = env.action_space.n
        +    q_table = np.zeros((n_states, n_actions))
        +
        +    # Track episode rewards for analysis
        +    episode_rewards = []
        +
        +    for episode in range(episodes):
        +        # Reset environment
        +        state, info = env.reset(seed=seed + episode)
        +        total_reward = 0
        +        done = False
        +        truncated = False
        +
        +        while not (done or truncated):
        +            # Get action mask if using it
        +            action_mask = info["action_mask"] if use_action_mask else None
        +
        +            # Epsilon-greedy action selection with masking
        +            if np.random.random() < epsilon:
        +                # Random action selection
        +                if use_action_mask:
        +                    # Only select from valid actions
        +                    valid_actions = np.nonzero(action_mask == 1)[0]
        +                    action = np.random.choice(valid_actions)
        +                else:
        +                    # Select from all actions
        +                    action = np.random.randint(0, n_actions)
        +            else:
        +                # Greedy action selection
        +                if use_action_mask:
        +                    # Only consider valid actions for exploitation
        +                    valid_actions = np.nonzero(action_mask == 1)[0]
        +                    if len(valid_actions) > 0:
        +                        action = valid_actions[np.argmax(q_table[state, valid_actions])]
        +                    else:
        +                        action = np.random.randint(0, n_actions)
        +                else:
        +                    # Consider all actions
        +                    action = np.argmax(q_table[state])
        +
        +            # Take action and observe result
        +            next_state, reward, done, truncated, info = env.step(action)
        +            total_reward += reward
        +
        +            # Q-learning update
        +            if not (done or truncated):
        +                if use_action_mask:
        +                    # Only consider valid next actions for bootstrapping
        +                    next_mask = info["action_mask"]
        +                    valid_next_actions = np.nonzero(next_mask == 1)[0]
        +                    if len(valid_next_actions) > 0:
        +                        next_max = np.max(q_table[next_state, valid_next_actions])
        +                    else:
        +                        next_max = 0
        +                else:
        +                    # Consider all next actions
        +                    next_max = np.max(q_table[next_state])
        +
        +                # Update Q-value
        +                q_table[state, action] = q_table[state, action] + learning_rate * (
        +                    reward + discount_factor * next_max - q_table[state, action]
        +                )
        +
        +            state = next_state
        +
        +        episode_rewards.append(total_reward)
        +
        +    return {
        +        "episode_rewards": episode_rewards,
        +        "mean_reward": np.mean(episode_rewards),
        +        "std_reward": np.std(episode_rewards),
        +    }
        +
        +
        +
        +
        +
        +

        Running the Experiment

        +

        Now we’ll run experiments to compare the performance of Q-learning agents with and without action masking. +We’ll use multiple random seeds to ensure robust statistical comparison.

        +

        The experiment setup: +- 12 independent runs with different random seeds +- 5000 episodes per run +- Standard Q-learning hyperparameters (α=0.1, γ=0.95, ε=0.1)

        +
        # Experiment parameters
        +n_runs = 12
        +episodes = 5000
        +learning_rate = 0.1
        +discount_factor = 0.95
        +epsilon = 0.1
        +
        +# Generate different seeds for each run
        +seeds = [BASE_RANDOM_SEED + i for i in range(n_runs)]
        +
        +# Store results for comparison
        +masked_results_list = []
        +unmasked_results_list = []
        +
        +# Run experiments with different seeds
        +for i, seed in enumerate(seeds):
        +    print(f"Run {i + 1}/{n_runs} with seed {seed}")
        +
        +    # Train agent WITH action masking
        +    env_masked = gym.make("Taxi-v3")
        +    masked_results = train_q_learning(
        +        env_masked,
        +        use_action_mask=True,
        +        seed=seed,
        +        learning_rate=learning_rate,
        +        discount_factor=discount_factor,
        +        epsilon=epsilon,
        +        episodes=episodes,
        +    )
        +    env_masked.close()
        +    masked_results_list.append(masked_results)
        +
        +    # Train agent WITHOUT action masking
        +    env_unmasked = gym.make("Taxi-v3")
        +    unmasked_results = train_q_learning(
        +        env_unmasked,
        +        use_action_mask=False,
        +        seed=seed,
        +        learning_rate=learning_rate,
        +        discount_factor=discount_factor,
        +        epsilon=epsilon,
        +        episodes=episodes,
        +    )
        +    env_unmasked.close()
        +    unmasked_results_list.append(unmasked_results)
        +
        +
        +
        +
        +

        Visualizing Results

        +

        After running all experiments, we calculate statistics and create visualizations to compare the performance of both approaches.

        +
        # Calculate statistics across runs
        +masked_mean_rewards = [r["mean_reward"] for r in masked_results_list]
        +unmasked_mean_rewards = [r["mean_reward"] for r in unmasked_results_list]
        +
        +masked_overall_mean = np.mean(masked_mean_rewards)
        +masked_overall_std = np.std(masked_mean_rewards)
        +unmasked_overall_mean = np.mean(unmasked_mean_rewards)
        +unmasked_overall_std = np.std(unmasked_mean_rewards)
        +
        +# Create visualization
        +plt.figure(figsize=(12, 8), dpi=100)
        +
        +# Plot individual runs with low alpha
        +for i, (masked_results, unmasked_results) in enumerate(
        +    zip(masked_results_list, unmasked_results_list)
        +):
        +    plt.plot(
        +        masked_results["episode_rewards"],
        +        label="With Action Masking" if i == 0 else None,
        +        color="blue",
        +        alpha=0.1,
        +    )
        +    plt.plot(
        +        unmasked_results["episode_rewards"],
        +        label="Without Action Masking" if i == 0 else None,
        +        color="red",
        +        alpha=0.1,
        +    )
        +
        +# Calculate and plot mean curves across all runs
        +masked_mean_curve = np.mean([r["episode_rewards"] for r in masked_results_list], axis=0)
        +unmasked_mean_curve = np.mean(
        +    [r["episode_rewards"] for r in unmasked_results_list], axis=0
        +)
        +
        +plt.plot(
        +    masked_mean_curve, label="With Action Masking (Mean)", color="blue", linewidth=2
        +)
        +plt.plot(
        +    unmasked_mean_curve,
        +    label="Without Action Masking (Mean)",
        +    color="red",
        +    linewidth=2,
        +)
        +
        +plt.xlabel("Episode")
        +plt.ylabel("Total Reward")
        +plt.title("Training Performance: Q-Learning with vs without Action Masking")
        +plt.legend()
        +plt.grid(True, alpha=0.3)
        +
        +# Save the figure
        +savefig_folder = Path("_static/img/tutorials/")
        +savefig_folder.mkdir(parents=True, exist_ok=True)
        +plt.savefig(
        +    savefig_folder / "taxi_v3_action_masking_comparison.png",
        +    bbox_inches="tight",
        +    dpi=150,
        +)
        +plt.show()
        +
        +
        +../../../_images/taxi_v3_action_masking_comparison.png +
        +
        +

        Results Analysis

        +

        The comparison demonstrates several important benefits of using action masking:

        +

        Key Benefits of Action Masking:

        +

        1. Faster Convergence: Agents with action masking typically learn faster because they don’t waste time exploring +invalid actions.

        +
          +
        1. Better Performance: By focusing only on valid actions, the agent can achieve higher rewards more consistently.

        2. +
        3. More Stable Learning: Action masking reduces the variance in learning by eliminating the randomness associated with invalid action selection.

        4. +
        5. Practical Applicability: In real-world scenarios, action masking prevents agents from taking actions that could be dangerous or impossible.

        6. +
        +

        Reminder of Key Implementation Details

        +
          +
        • Action Selection: We filter available actions using np.nonzero(action_mask == 1)[0] to get only valid actions

        • +
        • Q-Value Updates: When computing the maximum future Q-value, we only consider valid actions in the next state

        • +
        • Exploration: Random action selection is constrained to the set of valid actions

        • +
        +

        This approach ensures that the agent never selects invalid actions while still maintaining the exploration-exploitation balance necessary for effective learning.

        + +
        + +
        +
        + +
        + +
        +
        +
        + + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/tutorials/training_agents/blackjack_q_learning/index.html b/tutorials/training_agents/blackjack_q_learning/index.html index b6a0c5ca1..81e3121a1 100644 --- a/tutorials/training_agents/blackjack_q_learning/index.html +++ b/tutorials/training_agents/blackjack_q_learning/index.html @@ -8,7 +8,7 @@ - + @@ -221,8 +221,7 @@
      • Create a Custom Environment
      • Recording Agents
      • Speeding Up Training
      • -
      • Compatibility with Gym
      • -
      • Migration Guide - v0.21 to v1.0.0
      • +
      • Gym Migration Guide

      API

        @@ -302,6 +301,10 @@
    • Training Agents
    -
    Training Agents
    +
    Action Masking in the Taxi Environment
    diff --git a/tutorials/training_agents/frozenlake_q_learning/index.html b/tutorials/training_agents/frozenlake_q_learning/index.html index ba8be3776..0d60d5409 100644 --- a/tutorials/training_agents/frozenlake_q_learning/index.html +++ b/tutorials/training_agents/frozenlake_q_learning/index.html @@ -221,8 +221,7 @@
  • Create a Custom Environment
  • Recording Agents
  • Speeding Up Training
  • -
  • Compatibility with Gym
  • -
  • Migration Guide - v0.21 to v1.0.0
  • +
  • Gym Migration Guide
  • API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents

    API

      @@ -302,6 +301,10 @@
  • Training Agents