mirror of
https://github.com/Farama-Foundation/Gymnasium.git
synced 2025-08-19 13:32:03 +00:00
1 line
233 KiB
JavaScript
1 line
233 KiB
JavaScript
Search.setIndex({"docnames": ["404", "README", "api/env", "api/experimental", "api/experimental/functional", "api/experimental/vector", "api/experimental/vector_wrappers", "api/experimental/wrappers", "api/registry", "api/spaces", "api/spaces/composite", "api/spaces/fundamental", "api/spaces/utils", "api/spaces/vector_utils", "api/utils", "api/vector", "api/wrappers", "api/wrappers/action_wrappers", "api/wrappers/misc_wrappers", "api/wrappers/observation_wrappers", "api/wrappers/reward_wrappers", "content/basic_usage", "content/gym_compatibility", "content/migration-guide", "environments/atari", "environments/atari/adventure", "environments/atari/air_raid", "environments/atari/alien", "environments/atari/amidar", "environments/atari/assault", "environments/atari/asterix", "environments/atari/asteroids", "environments/atari/atlantis", "environments/atari/bank_heist", "environments/atari/battle_zone", "environments/atari/beam_rider", "environments/atari/berzerk", "environments/atari/bowling", "environments/atari/boxing", "environments/atari/breakout", "environments/atari/carnival", "environments/atari/centipede", "environments/atari/chopper_command", "environments/atari/complete_list", "environments/atari/crazy_climber", "environments/atari/defender", "environments/atari/demon_attack", "environments/atari/double_dunk", "environments/atari/elevator_action", "environments/atari/enduro", "environments/atari/fishing_derby", "environments/atari/freeway", "environments/atari/frostbite", "environments/atari/gopher", "environments/atari/gravitar", "environments/atari/hero", "environments/atari/ice_hockey", "environments/atari/jamesbond", "environments/atari/journey_escape", "environments/atari/kangaroo", "environments/atari/krull", "environments/atari/kung_fu_master", "environments/atari/montezuma_revenge", "environments/atari/ms_pacman", "environments/atari/name_this_game", "environments/atari/phoenix", "environments/atari/pitfall", "environments/atari/pong", "environments/atari/pooyan", "environments/atari/private_eye", "environments/atari/qbert", "environments/atari/riverraid", "environments/atari/road_runner", "environments/atari/robotank", "environments/atari/seaquest", "environments/atari/skiing", "environments/atari/solaris", "environments/atari/space_invaders", "environments/atari/star_gunner", "environments/atari/tennis", "environments/atari/time_pilot", "environments/atari/tutankham", "environments/atari/up_n_down", "environments/atari/venture", "environments/atari/video_pinball", "environments/atari/wizard_of_wor", "environments/atari/zaxxon", "environments/box2d", "environments/box2d/bipedal_walker", "environments/box2d/car_racing", "environments/box2d/lunar_lander", "environments/classic_control", "environments/classic_control/acrobot", "environments/classic_control/cart_pole", "environments/classic_control/mountain_car", "environments/classic_control/mountain_car_continuous", "environments/classic_control/pendulum", "environments/mujoco", "environments/mujoco/ant", "environments/mujoco/half_cheetah", "environments/mujoco/hopper", "environments/mujoco/humanoid", "environments/mujoco/humanoid_standup", "environments/mujoco/inverted_double_pendulum", "environments/mujoco/inverted_pendulum", "environments/mujoco/pusher", "environments/mujoco/reacher", "environments/mujoco/swimmer", "environments/mujoco/walker2d", "environments/third_party_environments", "environments/toy_text", "environments/toy_text/blackjack", "environments/toy_text/cliff_walking", "environments/toy_text/frozen_lake", "environments/toy_text/taxi", "index", "release_notes/gym_v0.19.0", "release_notes/gym_v0.20.0", "release_notes/gym_v0.21.0", "release_notes/gym_v0.22.0", "release_notes/gym_v0.23.0", "release_notes/gym_v0.23.1", "release_notes/gym_v0.24.0", "release_notes/gym_v0.24.1", "release_notes/gym_v0.25.0", "release_notes/gym_v0.25.1", "release_notes/gym_v0.25.2", "release_notes/gym_v0.26.0", "release_notes/gym_v0.26.1", "release_notes/gym_v0.26.2", "release_notes/index", "tutorials/gymnasium_basics/README", "tutorials/gymnasium_basics/environment_creation", "tutorials/gymnasium_basics/handling_time_limits", "tutorials/gymnasium_basics/implementing_custom_wrappers", "tutorials/gymnasium_basics/index", "tutorials/gymnasium_basics/vector_envs_tutorial", "tutorials/index", "tutorials/training_agents/README", "tutorials/training_agents/blackjack_tutorial", "tutorials/training_agents/index", "tutorials/training_agents/reinforce_invpend_gym_v26"], "filenames": ["404.md", "README.md", "api/env.md", "api/experimental.md", "api/experimental/functional.md", "api/experimental/vector.md", "api/experimental/vector_wrappers.md", "api/experimental/wrappers.md", "api/registry.md", "api/spaces.md", "api/spaces/composite.md", "api/spaces/fundamental.md", "api/spaces/utils.md", "api/spaces/vector_utils.md", "api/utils.md", "api/vector.md", "api/wrappers.md", "api/wrappers/action_wrappers.md", "api/wrappers/misc_wrappers.md", "api/wrappers/observation_wrappers.md", "api/wrappers/reward_wrappers.md", "content/basic_usage.md", "content/gym_compatibility.md", "content/migration-guide.md", "environments/atari.md", "environments/atari/adventure.md", "environments/atari/air_raid.md", "environments/atari/alien.md", "environments/atari/amidar.md", "environments/atari/assault.md", "environments/atari/asterix.md", "environments/atari/asteroids.md", "environments/atari/atlantis.md", "environments/atari/bank_heist.md", "environments/atari/battle_zone.md", "environments/atari/beam_rider.md", "environments/atari/berzerk.md", "environments/atari/bowling.md", "environments/atari/boxing.md", "environments/atari/breakout.md", "environments/atari/carnival.md", "environments/atari/centipede.md", "environments/atari/chopper_command.md", "environments/atari/complete_list.md", "environments/atari/crazy_climber.md", "environments/atari/defender.md", "environments/atari/demon_attack.md", "environments/atari/double_dunk.md", "environments/atari/elevator_action.md", "environments/atari/enduro.md", "environments/atari/fishing_derby.md", "environments/atari/freeway.md", "environments/atari/frostbite.md", "environments/atari/gopher.md", "environments/atari/gravitar.md", "environments/atari/hero.md", "environments/atari/ice_hockey.md", "environments/atari/jamesbond.md", "environments/atari/journey_escape.md", "environments/atari/kangaroo.md", "environments/atari/krull.md", "environments/atari/kung_fu_master.md", "environments/atari/montezuma_revenge.md", "environments/atari/ms_pacman.md", "environments/atari/name_this_game.md", "environments/atari/phoenix.md", "environments/atari/pitfall.md", "environments/atari/pong.md", "environments/atari/pooyan.md", "environments/atari/private_eye.md", "environments/atari/qbert.md", "environments/atari/riverraid.md", "environments/atari/road_runner.md", "environments/atari/robotank.md", "environments/atari/seaquest.md", "environments/atari/skiing.md", "environments/atari/solaris.md", "environments/atari/space_invaders.md", "environments/atari/star_gunner.md", "environments/atari/tennis.md", "environments/atari/time_pilot.md", "environments/atari/tutankham.md", "environments/atari/up_n_down.md", "environments/atari/venture.md", "environments/atari/video_pinball.md", "environments/atari/wizard_of_wor.md", "environments/atari/zaxxon.md", "environments/box2d.md", "environments/box2d/bipedal_walker.md", "environments/box2d/car_racing.md", "environments/box2d/lunar_lander.md", "environments/classic_control.md", "environments/classic_control/acrobot.md", "environments/classic_control/cart_pole.md", "environments/classic_control/mountain_car.md", "environments/classic_control/mountain_car_continuous.md", "environments/classic_control/pendulum.md", "environments/mujoco.md", "environments/mujoco/ant.md", "environments/mujoco/half_cheetah.md", "environments/mujoco/hopper.md", "environments/mujoco/humanoid.md", "environments/mujoco/humanoid_standup.md", "environments/mujoco/inverted_double_pendulum.md", "environments/mujoco/inverted_pendulum.md", "environments/mujoco/pusher.md", "environments/mujoco/reacher.md", "environments/mujoco/swimmer.md", "environments/mujoco/walker2d.md", "environments/third_party_environments.md", "environments/toy_text.md", "environments/toy_text/blackjack.md", "environments/toy_text/cliff_walking.md", "environments/toy_text/frozen_lake.md", "environments/toy_text/taxi.md", "index.md", "release_notes/gym_v0.19.0.md", "release_notes/gym_v0.20.0.md", "release_notes/gym_v0.21.0.md", "release_notes/gym_v0.22.0.md", "release_notes/gym_v0.23.0.md", "release_notes/gym_v0.23.1.md", "release_notes/gym_v0.24.0.md", "release_notes/gym_v0.24.1.md", "release_notes/gym_v0.25.0.md", "release_notes/gym_v0.25.1.md", "release_notes/gym_v0.25.2.md", "release_notes/gym_v0.26.0.md", "release_notes/gym_v0.26.1.md", "release_notes/gym_v0.26.2.md", "release_notes/index.md", "tutorials/gymnasium_basics/README.rst", "tutorials/gymnasium_basics/environment_creation.rst", "tutorials/gymnasium_basics/handling_time_limits.rst", "tutorials/gymnasium_basics/implementing_custom_wrappers.rst", "tutorials/gymnasium_basics/index.rst", "tutorials/gymnasium_basics/vector_envs_tutorial.rst", "tutorials/index.rst", "tutorials/training_agents/README.rst", "tutorials/training_agents/blackjack_tutorial.rst", "tutorials/training_agents/index.rst", "tutorials/training_agents/reinforce_invpend_gym_v26.rst"], "titles": ["404 - Page Not Found", "Gymnasium-docs", "Env", "Experimental", "Functional Environment", "Vectorizing Environment", "Vector Environment Wrappers", "Wrappers", "Registry", "Spaces", "Composite Spaces", "Fundamental Spaces", "Spaces Utils", "Spaces Vector Utils", "Utils", "Vector", "Wrappers", "Action Wrappers", "Misc Wrappers", "Observation Wrappers", "Reward Wrappers", "Basic Usage", "Compatibility with Gym", "v21 to v26 Migration Guide", "Atari", "Adventure", "Air Raid", "Alien", "Amidar", "Assault", "Asterix", "Asteroids", "Atlantis", "Bank Heist", "Battle Zone", "Beam Rider", "Berzerk", "Bowling", "Boxing", "Breakout", "Carnival", "Centipede", "Chopper Command", "Complete List - Atari", "Crazy Climber", "Defender", "Demon Attack", "Double Dunk", "Elevator Action", "Enduro", "FishingDerby", "Freeway", "Frostbite", "Gopher", "Gravitar", "Hero", "IceHockey", "Jamesbond", "JourneyEscape", "Kangaroo", "Krull", "Kung Fu Master", "Montezuma Revenge", "Ms Pacman", "Name This Game", "Phoenix", "Pitfall", "Pong", "Pooyan", "PrivateEye", "Qbert", "Riverraid", "Road Runner", "Robot Tank", "Seaquest", "Skiings", "Solaris", "SpaceInvaders", "StarGunner", "Tennis", "TimePilot", "Tutankham", "Up n\u2019 Down", "Venture", "Video Pinball", "Wizard of Wor", "Zaxxon", "Box2D", "Bipedal Walker", "Car Racing", "Lunar Lander", "Classic Control", "Acrobot", "Cart Pole", "Mountain Car", "Mountain Car Continuous", "Pendulum", "MuJoCo", "Ant", "Half Cheetah", "Hopper", "Humanoid", "Humanoid Standup", "Inverted Double Pendulum", "Inverted Pendulum", "Pusher", "Reacher", "Swimmer", "Walker2D", "Third-party Environments", "Toy Text", "Blackjack", "Cliff Walking", "Frozen Lake", "Taxi", "Gymnasium is a standard API for reinforcement learning, and a diverse collection of reference environments", "v0.19.0 Release Notes", "v0.20.0 Release Notes", "v0.21.0 Release Notes", "v0.22 Release Notes", "v0.23.0 Release Notes", "v0.23.1 Release Notes", "v0.24.0 Release Notes", "v0.24.1 Release Notes", "v0.25.0 Release notes", "0.25.1 Release Notes", "v0.25.2 Release Notes", "v0.26.0 Release Notes", "v0.26.1 Release Notes", "v0.26.2 Release Notes", "Release Notes", "Gymnasium Basics", "Make your own custom environment", "Handling Time Limits", "Implementing Custom Wrappers", "Gymnasium Basics", "Training A2C with Vector Envs and Domain Randomization", "Tutorials", "Training Agents", "Solving Blackjack with Q-Learning", "Training Agents", "Training using REINFORCE for Mujoco"], "terms": {"thi": [1, 2, 3, 4, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 111, 112, 113, 114, 115, 116, 117, 119, 120, 121, 122, 123, 124, 126, 127, 128, 129, 130, 132, 133, 134, 136, 139, 141], "folder": [1, 7, 14, 18, 105, 106, 130], "contain": [1, 2, 3, 7, 9, 12, 13, 15, 16, 18, 19, 21, 23, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 98, 99, 100, 101, 105, 106, 107, 108, 109, 111, 114, 117, 120, 121, 129, 130, 132, 136, 139, 141], "If": [1, 2, 3, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 24, 30, 33, 38, 41, 50, 51, 52, 53, 54, 68, 75, 79, 88, 89, 90, 95, 98, 100, 101, 102, 106, 108, 111, 112, 113, 122, 127, 130, 132, 134, 136, 139], "you": [1, 2, 7, 9, 10, 11, 12, 14, 15, 16, 17, 18, 19, 20, 21, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 89, 90, 98, 101, 102, 105, 106, 109, 115, 117, 118, 122, 124, 127, 130, 132, 133, 134, 136], "ar": [1, 2, 3, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 117, 118, 119, 124, 126, 127, 129, 130, 132, 133, 134, 136, 139, 141], "pleas": [1, 2, 3, 14, 23, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 89, 90, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 112, 113, 114, 117, 118, 124, 130], "pr": [1, 23, 109, 118, 122], "repo": [1, 24, 117, 130], "otherwis": [1, 2, 7, 8, 10, 11, 14, 15, 18, 19, 24, 37, 109, 124, 139], "follow": [1, 4, 7, 8, 9, 14, 18, 21, 24, 37, 47, 49, 50, 51, 52, 53, 54, 79, 92, 93, 94, 95, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 111, 112, 113, 114, 127, 130, 132, 133, 134, 139, 141], "below": [1, 11, 16, 21, 50, 88, 90, 96, 105, 108, 130, 133, 136, 139], "directli": [1, 7, 10, 16, 18, 21, 92, 109, 132, 139, 141], "markdown": 1, "file": [1, 92, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 119, 123, 124, 130, 132], "repositori": [1, 97, 122], "fork": [1, 23, 109, 115, 130], "docstr": [1, 123, 124, 125, 130], "": [1, 2, 3, 4, 7, 10, 11, 14, 15, 16, 17, 18, 19, 20, 21, 24, 44, 50, 51, 52, 53, 54, 56, 57, 60, 61, 62, 67, 68, 70, 87, 88, 89, 90, 91, 92, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 118, 119, 122, 127, 129, 130, 132, 133, 134, 136, 139, 141], "python": [1, 7, 8, 13, 18, 21, 88, 89, 90, 115, 119, 122, 124, 130, 132, 133, 134, 136, 137, 139, 141], "Then": [1, 16, 21, 74, 107, 134], "pip": [1, 24, 87, 91, 97, 118, 122, 130, 132], "instal": [1, 7, 14, 18, 32, 87, 91, 97, 116, 117, 118, 122, 128, 130, 132], "your": [1, 2, 3, 7, 9, 15, 16, 17, 18, 19, 20, 21, 27, 28, 30, 32, 33, 35, 37, 38, 39, 41, 47, 49, 50, 51, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 67, 69, 70, 71, 72, 73, 74, 75, 76, 77, 80, 81, 82, 83, 84, 85, 86, 89, 98, 101, 102, 115, 127, 130, 134, 135, 136, 137, 139], "run": [1, 2, 7, 8, 15, 18, 33, 55, 58, 66, 71, 72, 75, 76, 88, 90, 92, 98, 99, 100, 101, 102, 103, 104, 107, 108, 109, 112, 118, 122, 132, 136], "script": [1, 139], "gen_md": 1, "py": [1, 13, 24, 88, 89, 90, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 112, 116, 117, 118, 121, 122, 123, 124, 125, 127, 128, 130, 132, 133, 134, 136, 139, 141], "automat": [1, 2, 3, 7, 8, 15, 16, 18, 22, 23, 119, 122, 124, 130, 132, 136], "gener": [1, 2, 7, 9, 10, 11, 14, 15, 16, 18, 19, 21, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 89, 90, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 111, 112, 113, 114, 115, 116, 119, 127, 130, 132, 136], "For": [1, 2, 4, 7, 11, 12, 14, 18, 19, 21, 22, 23, 24, 25, 27, 28, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 45, 55, 56, 57, 58, 59, 60, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 89, 90, 97, 112, 113, 114, 122, 124, 126, 127, 130, 132, 134, 136, 139], "add": [1, 7, 8, 14, 15, 19, 21, 89, 97, 101, 102, 114, 117, 118, 121, 123, 124, 126, 129, 130, 132, 134, 136, 139], "complet": [1, 7, 18, 21, 23, 24, 44, 57, 69, 70, 89, 90, 130, 133, 134, 139], "ensur": [1, 2, 3, 8, 10, 12, 14, 21, 130, 132, 139], "i": [1, 2, 3, 4, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 89, 90, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 111, 112, 113, 114, 116, 117, 118, 119, 122, 123, 124, 125, 126, 127, 128, 129, 130, 132, 133, 134, 136, 139, 141], "ha": [1, 2, 3, 7, 9, 11, 12, 14, 16, 18, 19, 20, 21, 23, 24, 54, 74, 88, 89, 90, 91, 97, 98, 99, 100, 101, 102, 105, 106, 107, 108, 109, 111, 115, 118, 119, 122, 124, 127, 128, 129, 130, 132, 133, 136, 139, 141], "properli": [1, 9, 117, 118], "format": [1, 9, 14, 16, 18, 19, 21, 130], "md": [1, 118, 130, 132], "correspond": [1, 2, 8, 16, 23, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 90, 92, 93, 94, 95, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 114, 132, 136, 141], "gif": [1, 92], "_static": 1, "video": [1, 7, 16, 18, 43, 73, 88, 116, 117, 118, 124], "env_typ": 1, "where": [1, 3, 7, 8, 10, 11, 12, 14, 16, 18, 21, 23, 24, 47, 89, 92, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 112, 113, 114, 115, 124, 128, 132, 133, 134, 136, 139, 141], "categori": 1, "e": [1, 2, 3, 7, 9, 11, 12, 13, 15, 16, 18, 19, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 105, 106, 109, 111, 113, 117, 127, 130, 132, 134, 136, 139, 141], "g": [1, 2, 9, 11, 12, 13, 15, 19, 75, 92, 96, 109, 113, 114, 117, 124, 125, 132, 134, 136, 139, 141], "mujoco": [1, 16, 21, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 120, 122, 123, 124, 127, 128, 130, 134, 137, 140], "snake_cas": 1, "name": [1, 3, 4, 8, 16, 43, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 118, 119, 130, 132], "convent": [1, 2, 24], "altern": [1, 24], "gen_gif": 1, "index": [1, 7, 13, 14, 18, 19, 21, 24, 93, 102], "toctre": 1, "requir": [1, 2, 7, 9, 19, 97, 116, 119, 122, 124, 126, 130, 136, 139, 141], "packag": [1, 7, 18, 109, 119], "cd": [1, 132], "r": [1, 7, 11, 18, 20, 73, 92, 96, 109, 111, 112, 114, 134, 141], "txt": [1, 116], "To": [1, 7, 8, 13, 15, 16, 18, 19, 21, 22, 23, 24, 32, 42, 70, 88, 89, 90, 92, 114, 122, 132, 134, 136, 139, 141], "builder": 1, "onc": [1, 7, 18, 31, 41, 48, 55, 103, 106, 114, 127, 132, 136, 139], "make": [1, 2, 7, 10, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 89, 90, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 112, 113, 114, 115, 117, 121, 122, 123, 124, 126, 127, 128, 130, 134, 135, 136, 137, 139, 141], "dirhtml": 1, "_build": 1, "rebuild": [1, 32], "everi": [1, 7, 9, 14, 18, 21, 41, 42, 46, 51, 73, 74, 83, 89, 90, 93, 98, 100, 101, 108, 109, 130, 132, 136, 141], "time": [1, 2, 7, 8, 10, 14, 15, 16, 18, 19, 23, 24, 40, 43, 46, 47, 48, 52, 56, 58, 59, 66, 70, 71, 72, 73, 74, 75, 88, 89, 96, 98, 99, 100, 101, 102, 107, 108, 109, 112, 114, 117, 118, 127, 132, 135, 136, 137, 139, 141], "chang": [1, 2, 3, 4, 7, 13, 14, 15, 16, 18, 19, 20, 21, 22, 23, 24, 52, 60, 70, 89, 92, 93, 94, 95, 96, 97, 105, 106, 109, 114, 116, 118, 121, 130, 132, 134, 139, 141], "made": [1, 3, 105, 106, 117, 118, 130], "sphinx": 1, "autobuild": 1, "b": [1, 11, 105, 106, 114], "we": [1, 2, 3, 4, 7, 11, 18, 19, 21, 23, 24, 98, 101, 102, 118, 122, 124, 126, 127, 130, 132, 133, 134, 136, 139, 141], "us": [1, 2, 3, 4, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 113, 114, 116, 117, 118, 119, 122, 124, 125, 126, 127, 128, 130, 133, 134, 137, 139, 140], "galleri": [1, 130], "insid": [1, 10, 11, 18, 132], "directori": 1, "check": [1, 2, 7, 9, 11, 16, 18, 114, 122, 123, 130, 132, 134, 139], "demo": 1, "see": [1, 2, 9, 14, 15, 21, 23, 24, 25, 28, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 45, 55, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 90, 92, 98, 99, 100, 101, 107, 108, 109, 113, 117, 122, 124, 127, 130, 132, 136], "exampl": [1, 2, 7, 10, 11, 12, 13, 14, 15, 17, 18, 19, 20, 21, 22, 89, 92, 111, 112, 113, 124, 128, 132, 133, 134, 136, 137, 139], "more": [1, 2, 3, 9, 10, 11, 14, 15, 16, 19, 23, 24, 25, 28, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 45, 50, 55, 56, 57, 58, 59, 60, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 88, 90, 97, 98, 101, 102, 103, 104, 105, 106, 107, 109, 122, 124, 127, 128, 130, 132, 133, 134, 136, 139, 141], "inform": [1, 2, 7, 9, 10, 11, 14, 15, 16, 18, 19, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 89, 90, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 127, 132, 133, 139, 141], "convert": [1, 7, 8, 9, 10, 16, 18, 19, 22, 23, 89, 127, 130, 139], "jupyt": [1, 121, 132, 133, 134, 136, 137, 139, 141], "notebook": [1, 121, 132, 133, 134, 136, 137, 139, 141], "can": [1, 2, 3, 7, 8, 9, 10, 11, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 111, 112, 113, 114, 117, 118, 119, 122, 124, 126, 127, 129, 130, 132, 134, 136, 141], "want": [1, 2, 7, 10, 15, 16, 18, 21, 33, 55, 127, 130, 132, 134, 136, 139], "execut": [1, 7, 14, 17, 24, 47, 114, 132, 136, 141], "which": [1, 2, 7, 8, 9, 10, 12, 13, 14, 15, 18, 19, 20, 21, 22, 23, 24, 44, 46, 48, 62, 89, 90, 92, 93, 97, 98, 99, 100, 101, 102, 103, 105, 106, 107, 108, 109, 112, 113, 114, 119, 121, 124, 127, 130, 132, 133, 134, 136, 141], "output": [1, 7, 13, 14, 18, 21, 127, 136, 139, 141], "plot": [1, 14, 139], "should": [1, 2, 3, 7, 9, 11, 14, 15, 18, 19, 21, 23, 105, 106, 116, 121, 122, 124, 130, 132, 134, 136, 139], "start": [1, 2, 7, 9, 11, 14, 15, 18, 34, 47, 48, 54, 58, 59, 74, 136, 139, 141], "run_": 1, "note": [1, 7, 9, 13, 18, 92, 93, 98, 101, 102, 114, 133, 136, 139, 141], "so": [1, 3, 7, 14, 15, 18, 19, 21, 24, 52, 75, 90, 91, 98, 99, 100, 101, 102, 103, 104, 107, 108, 109, 113, 118, 127, 130, 132, 133, 134, 136, 139], "sure": [1, 2, 18, 132, 134], "doesn": [1, 2, 7, 8, 18, 24, 90, 133], "t": [1, 2, 3, 7, 8, 10, 12, 14, 16, 18, 19, 20, 23, 24, 40, 50, 51, 52, 53, 54, 73, 74, 89, 90, 94, 95, 114, 124, 127, 130, 132, 133, 136, 139], "take": [1, 2, 4, 7, 8, 11, 12, 14, 15, 17, 18, 21, 23, 24, 77, 91, 93, 95, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 114, 127, 134, 136, 139, 141], "than": [1, 23, 50, 56, 74, 90, 92, 93, 94, 95, 99, 103, 104, 105, 107, 109, 111, 127, 136, 139], "few": [1, 92, 120, 121, 139], "second": [1, 7, 10, 14, 15, 37, 68, 75, 90, 99, 103, 106, 107], "class": [2, 4, 7, 10, 11, 14, 15, 16, 18, 21, 97, 119, 130, 132, 134, 136, 139, 141], "The": [2, 3, 4, 7, 8, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 111, 112, 113, 114, 115, 118, 119, 122, 124, 127, 130, 132, 133, 136, 139, 141], "main": [2, 90, 100, 108, 130], "reinforc": [2, 9, 21, 92, 107, 110, 111, 112, 114, 124, 130, 133, 136, 137, 139, 140], "learn": [2, 7, 9, 10, 18, 19, 20, 21, 24, 50, 51, 52, 53, 54, 88, 89, 90, 92, 93, 94, 95, 99, 102, 103, 104, 107, 110, 111, 112, 114, 119, 124, 132, 136, 137, 140], "agent": [2, 3, 7, 9, 18, 21, 23, 24, 48, 57, 88, 89, 90, 94, 98, 99, 100, 101, 102, 103, 104, 107, 108, 124, 128, 130, 132, 133, 134], "encapsul": 2, "an": [2, 3, 4, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 90, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 105, 106, 107, 108, 109, 111, 112, 113, 114, 118, 122, 124, 125, 128, 130, 132, 133, 134, 136], "arbitrari": [2, 8, 11, 14, 19, 20, 109, 136], "behind": [2, 68, 130], "scene": [2, 68, 109, 130], "dynam": [2, 24, 39, 50, 51, 52, 53, 54, 92, 96, 97, 103, 124], "through": [2, 7, 8, 9, 15, 22, 23, 24, 39, 55, 58, 61, 62, 66, 75, 76, 101, 102, 116, 122, 124, 127, 130, 133], "step": [2, 7, 8, 15, 16, 17, 18, 19, 20, 21, 24, 88, 90, 92, 93, 96, 112, 113, 114, 115, 118, 119, 122, 123, 124, 126, 127, 129, 130, 133, 134, 136, 139, 141], "reset": [2, 7, 8, 14, 15, 16, 17, 18, 19, 20, 21, 92, 93, 94, 95, 96, 109, 112, 113, 114, 115, 118, 119, 122, 123, 124, 125, 127, 129, 130, 136, 139, 141], "function": [2, 7, 8, 9, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 90, 96, 98, 106, 109, 113, 114, 117, 119, 122, 124, 126, 127, 130, 133, 134, 136, 139, 141], "partial": [2, 124], "fulli": [2, 117], "observ": [2, 4, 9, 10, 13, 14, 15, 16, 17, 18, 20, 23, 109, 115, 117, 122, 123, 124, 125, 127, 128, 129, 130, 133, 134, 141], "singl": [2, 4, 7, 9, 10, 11, 12, 13, 14, 15, 19, 21, 100, 101, 102, 108, 124, 127, 132, 141], "multi": [2, 11, 97, 101, 102, 105], "pettingzoo": [2, 116, 117], "api": [2, 4, 7, 16, 18, 21, 23, 116, 122, 125, 126, 127, 128, 130, 132, 133, 136], "user": [2, 3, 4, 8, 15, 21, 23, 24, 92, 93, 94, 95, 96, 109, 125, 126, 127, 130, 132, 141], "need": [2, 8, 9, 10, 14, 16, 17, 18, 19, 21, 23, 42, 44, 49, 55, 59, 69, 74, 88, 90, 93, 97, 118, 124, 132, 133, 134, 136, 139], "know": [2, 3, 18, 21, 130, 132], "updat": [2, 7, 14, 18, 19, 21, 22, 23, 114, 116, 124, 127, 128, 129, 130, 132, 133, 134, 136, 139, 141], "action": [2, 4, 8, 9, 10, 11, 14, 15, 16, 18, 23, 43, 91, 109, 110, 115, 118, 119, 123, 124, 127, 130, 132, 134, 136, 141], "return": [2, 4, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 98, 99, 100, 101, 102, 103, 105, 106, 107, 108, 111, 112, 113, 114, 119, 123, 124, 127, 129, 130, 132, 133, 134, 136, 139, 141], "next": [2, 4, 13, 21, 23, 44, 46, 48, 141], "reward": [2, 4, 8, 14, 15, 16, 18, 21, 23, 97, 109, 115, 116, 124, 127, 130, 132, 133, 134, 136, 139, 141], "termin": [2, 4, 7, 8, 14, 15, 16, 18, 20, 21, 22, 23, 92, 93, 94, 95, 98, 100, 101, 102, 103, 104, 105, 106, 108, 111, 112, 113, 114, 115, 124, 126, 127, 132, 134, 136, 139, 141], "truncat": [2, 7, 8, 14, 15, 16, 18, 20, 21, 22, 23, 92, 93, 94, 95, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 113, 114, 115, 124, 126, 127, 128, 130, 132, 134, 136, 139, 141], "due": [2, 23, 113, 124, 125, 126, 133, 136], "latest": [2, 141], "from": [2, 3, 4, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 23, 24, 26, 40, 47, 52, 53, 56, 58, 67, 68, 80, 86, 88, 89, 90, 92, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 111, 112, 113, 114, 117, 119, 123, 124, 127, 128, 130, 133, 136, 139, 141], "about": [2, 4, 14, 19, 21, 69, 92, 98, 101, 102, 132, 133, 139, 141], "metric": [2, 14, 23, 130, 136], "debug": [2, 9, 14, 110, 126], "info": [2, 4, 7, 14, 15, 16, 18, 20, 21, 23, 98, 99, 100, 101, 105, 106, 107, 108, 114, 115, 119, 122, 124, 126, 127, 129, 130, 132, 133, 134, 136, 139, 141], "initi": [2, 4, 7, 8, 10, 11, 15, 16, 17, 18, 19, 20, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 90, 91, 92, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 111, 112, 113, 114, 124, 127, 134, 136, 139, 141], "state": [2, 4, 7, 16, 18, 19, 21, 23, 24, 91, 97, 109, 110, 124, 126, 133, 136, 139, 141], "befor": [2, 7, 8, 14, 15, 16, 17, 18, 19, 20, 32, 44, 58, 69, 76, 77, 89, 98, 99, 100, 101, 102, 103, 104, 106, 107, 108, 118, 119, 122, 124, 130, 132, 134, 141], "call": [2, 7, 8, 12, 14, 15, 16, 17, 18, 19, 21, 22, 23, 24, 37, 56, 105, 106, 111, 113, 118, 122, 123, 124, 132, 136, 139], "first": [2, 14, 15, 16, 18, 19, 21, 23, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 89, 90, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 111, 112, 113, 114, 116, 118, 123, 130, 132, 139, 141], "episod": [2, 7, 8, 14, 16, 18, 19, 23, 127, 132, 133, 136, 139, 141], "render": [2, 4, 15, 16, 18, 19, 21, 24, 87, 88, 98, 99, 100, 101, 102, 103, 104, 107, 108, 109, 117, 119, 120, 122, 123, 124, 125, 126, 127, 128, 129, 130, 134, 139], "help": [2, 9, 21, 27, 59, 62, 105, 122, 127, 130, 136, 139], "visualis": [2, 21], "what": [2, 9, 18, 24, 112, 130], "mode": [2, 15, 16, 18, 21, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 124, 127, 130, 132, 136, 139], "human": [2, 7, 10, 16, 18, 21, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 89, 101, 102, 105, 115, 124, 127, 130, 132, 136], "rgb_arrai": [2, 7, 14, 16, 18, 19, 24, 124, 127, 132, 136], "ansi": [2, 127, 132], "text": [2, 9, 10, 12, 21, 111, 112, 113, 114, 117, 124, 127], "close": [2, 4, 11, 14, 15, 16, 21, 23, 44, 69, 98, 100, 101, 106, 108, 115, 117, 123, 127, 130, 134, 136, 139], "import": [2, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 89, 90, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 112, 113, 114, 115, 122, 124, 127, 132, 134, 136, 141], "when": [2, 3, 7, 9, 10, 12, 13, 14, 15, 16, 18, 19, 22, 24, 27, 40, 44, 45, 46, 48, 50, 51, 52, 53, 54, 56, 57, 71, 72, 73, 74, 77, 89, 90, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 112, 113, 114, 117, 118, 119, 122, 124, 126, 129, 130, 132, 133, 134, 136, 141], "extern": [2, 23, 98, 101, 102, 127, 133], "softwar": [2, 109], "pygam": [2, 14, 23, 87, 119, 121, 122, 132], "databas": 2, "have": [2, 7, 8, 9, 11, 12, 15, 16, 17, 18, 20, 21, 22, 23, 24, 25, 27, 30, 32, 33, 37, 39, 41, 42, 44, 45, 50, 51, 52, 53, 54, 55, 58, 59, 60, 64, 66, 68, 74, 76, 87, 88, 89, 92, 98, 99, 100, 101, 102, 104, 105, 107, 108, 109, 111, 113, 114, 118, 119, 122, 124, 127, 130, 132, 133, 134, 136, 139, 141], "understand": [2, 12, 15, 105, 109, 141], "action_spac": [2, 7, 9, 14, 15, 16, 17, 19, 20, 21, 23, 114, 115, 132, 134, 139, 141], "space": [2, 3, 7, 14, 15, 16, 17, 18, 19, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 97, 109, 110, 116, 117, 118, 119, 122, 123, 124, 125, 126, 128, 130, 132, 134, 136, 141], "object": [2, 9, 13, 16, 21, 25, 30, 44, 50, 51, 59, 71, 77, 105, 139, 141], "valid": [2, 7, 8, 9, 11, 13, 15, 16, 17, 18, 21, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 136, 139], "all": [2, 3, 7, 9, 10, 11, 15, 16, 18, 21, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 51, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 89, 90, 91, 92, 93, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 111, 112, 113, 116, 117, 119, 124, 126, 127, 130, 134, 136, 137, 139, 141], "within": [2, 7, 9, 17, 19, 21, 23, 62, 66, 90, 91, 103, 104, 127, 129, 130], "observation_spac": [2, 7, 9, 10, 11, 15, 16, 19, 21, 132, 134, 141], "reward_rang": [2, 16, 20, 134], "A": [2, 4, 7, 9, 10, 11, 12, 14, 15, 17, 18, 19, 20, 22, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 89, 92, 93, 95, 98, 99, 100, 101, 102, 103, 105, 106, 107, 108, 111, 112, 113, 118, 124, 125, 127, 130, 132, 133, 134, 136, 139, 141], "tupl": [2, 4, 7, 9, 11, 12, 13, 14, 16, 19, 21, 23, 24, 98, 100, 101, 108, 111, 117, 126, 132, 136, 139, 141], "minimum": [2, 7, 11, 96], "maximum": [2, 7, 8, 11, 14, 18, 21, 73, 74, 90, 92, 96, 103, 132, 136], "possibl": [2, 9, 10, 11, 12, 21, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 90, 92, 93, 94, 95, 99, 101, 103, 104, 107, 108, 109, 112, 113, 114, 127, 132, 139], "over": [2, 7, 13, 18, 27, 33, 56, 66, 71, 99, 101, 111, 113, 119, 126, 127, 134, 136, 139], "default": [2, 7, 8, 9, 10, 11, 14, 15, 16, 18, 19, 21, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 89, 92, 96, 98, 99, 100, 101, 105, 106, 107, 108, 119, 122, 124, 127, 132, 133], "rang": [2, 7, 13, 14, 16, 17, 18, 20, 21, 22, 23, 24, 56, 88, 91, 92, 93, 94, 95, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 112, 113, 114, 115, 132, 134, 136, 139, 141], "set": [2, 7, 9, 10, 11, 15, 17, 18, 19, 23, 24, 25, 26, 27, 28, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 82, 83, 84, 85, 87, 90, 91, 92, 94, 95, 97, 98, 99, 100, 101, 105, 106, 107, 108, 109, 113, 119, 122, 124, 127, 132, 133, 134, 136, 139, 141], "infti": [2, 11], "spec": [2, 15, 16, 18], "metadata": [2, 7, 14, 16, 18, 24, 120, 125, 126, 130, 132, 134], "fp": [2, 7, 14, 24, 132], "np_random": [2, 14, 16, 18, 23, 123, 127, 130, 132], "random": [2, 7, 9, 10, 11, 14, 18, 19, 21, 24, 89, 90, 92, 93, 94, 95, 96, 98, 99, 100, 101, 106, 107, 108, 109, 113, 114, 119, 124, 127, 130, 132, 135, 137, 139, 141], "number": [2, 3, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 18, 19, 21, 22, 24, 26, 27, 28, 29, 30, 31, 32, 35, 36, 37, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 58, 61, 63, 64, 65, 67, 68, 70, 73, 75, 77, 78, 80, 81, 82, 84, 85, 89, 90, 92, 100, 101, 102, 107, 108, 109, 111, 113, 119, 124, 127, 130, 132, 136, 141], "assign": [2, 75, 93, 94, 95, 105, 106, 139], "dure": [2, 7, 10, 11, 15, 18, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 92, 98, 99, 100, 101, 107, 108, 114, 119, 123, 124, 127, 132, 134], "super": [2, 16, 23, 116, 127, 132, 134, 136, 141], "seed": [2, 7, 8, 9, 10, 11, 13, 15, 16, 17, 19, 21, 72, 115, 117, 119, 122, 126, 127, 130, 132, 136, 141], "assess": 2, "self": [2, 4, 7, 9, 10, 16, 17, 18, 19, 20, 95, 109, 132, 134, 136, 139, 141], "modifi": [2, 7, 9, 15, 16, 17, 19, 20, 23, 92, 105, 106, 114, 119, 122, 124, 130, 132, 134], "extend": [2, 98], "wrapper": [2, 8, 10, 11, 14, 15, 21, 22, 105, 106, 109, 113, 114, 115, 117, 118, 120, 122, 123, 124, 125, 126, 127, 129, 130, 135, 136, 137, 139, 141], "acttyp": [2, 4, 7, 14, 16, 17, 19, 20], "obstyp": [2, 4, 7, 14, 16, 17, 19, 20, 23, 141], "supportsfloat": [2, 7, 8, 11, 16, 20, 23, 134, 141], "bool": [2, 7, 8, 9, 11, 14, 15, 16, 18, 19, 23, 24, 90, 98, 99, 100, 101, 107, 108, 132, 139, 141], "dict": [2, 4, 7, 8, 9, 11, 12, 13, 14, 15, 16, 18, 19, 21, 23, 112, 113, 114, 117, 118, 125, 126, 132, 141], "str": [2, 4, 7, 8, 9, 10, 11, 12, 14, 15, 16, 18, 19, 23, 24, 98, 99, 100, 101, 107, 108, 139, 141], "ani": [2, 4, 7, 8, 9, 10, 11, 12, 13, 14, 16, 18, 19, 23, 24, 46, 50, 51, 52, 53, 54, 55, 73, 90, 93, 98, 100, 101, 102, 103, 104, 105, 106, 107, 108, 113, 127, 132, 133, 139, 141], "one": [2, 10, 11, 12, 14, 15, 16, 18, 19, 21, 22, 23, 26, 27, 28, 32, 37, 44, 47, 48, 60, 69, 70, 71, 73, 74, 79, 92, 93, 94, 95, 96, 98, 100, 102, 103, 104, 106, 107, 111, 114, 119, 127, 133, 134, 136, 139, 141], "timestep": [2, 7, 18, 19, 21, 94, 95, 98, 100, 101, 102, 103, 104, 105, 106, 108, 132, 136, 141], "end": [2, 4, 7, 16, 18, 21, 32, 41, 42, 44, 46, 48, 49, 57, 58, 59, 69, 73, 76, 77, 88, 96, 124, 133, 139, 141], "reach": [2, 7, 16, 23, 32, 34, 44, 47, 48, 65, 68, 76, 77, 91, 92, 93, 94, 95, 98, 100, 101, 102, 103, 104, 105, 106, 108, 112, 113, 114, 132, 133, 139, 141], "necessari": [2, 9, 24, 50, 51, 52, 53, 54, 122, 127, 128], "version": [2, 3, 8, 9, 16, 93, 116, 117, 118, 119, 122, 123, 124, 127, 130, 132, 133, 136, 139], "0": [2, 3, 7, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 89, 90, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 112, 113, 114, 119, 121, 123, 126, 128, 129, 132, 133, 134, 136, 139, 141], "26": [2, 22, 98, 101, 102, 132, 133, 141], "wa": [2, 7, 14, 15, 19, 20, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 98, 99, 100, 101, 107, 108, 118, 122, 124, 127, 128, 129, 130, 133, 134, 136, 141], "remov": [2, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 92, 98, 114, 116, 117, 119, 120, 121, 122, 123, 124, 125, 126, 127, 130], "done": [2, 8, 14, 16, 18, 21, 22, 23, 98, 100, 101, 102, 103, 104, 108, 122, 124, 126, 132, 133, 136, 139, 141], "favor": [2, 117, 119, 130], "clearer": [2, 118], "had": [2, 118], "critic": [2, 3, 18, 130], "bootstrap": [2, 23, 133], "algorithm": [2, 9, 97, 110, 114, 117, 124, 133, 136, 139, 141], "paramet": [2, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 23, 90, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 107, 108, 122, 124, 127, 132, 134, 136, 141], "provid": [2, 3, 7, 9, 10, 11, 14, 15, 16, 17, 18, 19, 21, 22, 24, 30, 44, 46, 50, 51, 52, 53, 54, 88, 92, 109, 127, 130, 132, 139], "element": [2, 7, 9, 10, 11, 13, 15, 19, 21, 93, 94, 95, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 132, 136], "numpi": [2, 3, 4, 7, 9, 11, 13, 15, 16, 17, 19, 23, 109, 116, 130, 132, 134, 136, 139, 141], "arrai": [2, 7, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 90, 109, 125, 127, 128, 130, 132, 134, 136, 139, 141], "posit": [2, 7, 10, 11, 12, 13, 14, 18, 21, 24, 35, 56, 88, 89, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 112, 113, 114, 132, 134, 139], "veloc": [2, 10, 12, 13, 88, 90, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108], "pole": [2, 75, 91, 103, 104, 109, 141], "cartpol": [2, 7, 8, 14, 15, 18, 19, 20, 21, 91, 93, 103, 104, 109, 127, 141], "result": [2, 3, 12, 14, 15, 21, 92, 98, 101, 102, 110, 112, 114, 124, 130, 136, 139], "whether": [2, 4, 7, 8, 9, 11, 14, 18, 23, 37, 90, 98, 99, 100, 101, 107, 108, 111, 132, 133, 139, 141], "defin": [2, 4, 7, 9, 12, 17, 18, 19, 20, 21, 96, 101, 132, 133, 134, 136], "under": [2, 7, 19, 20, 139, 141], "mdp": [2, 18, 21, 94, 95], "task": [2, 10, 16, 21, 60, 66, 69, 89, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 114, 132, 133, 134, 141], "neg": [2, 11, 14, 21, 75, 95, 98, 99, 101, 102, 103, 105, 106, 114, 141], "goal": [2, 27, 30, 35, 37, 39, 41, 44, 56, 61, 62, 63, 64, 65, 67, 70, 72, 74, 75, 81, 82, 83, 84, 85, 86, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 111, 112, 113, 114, 132, 141], "move": [2, 3, 7, 16, 20, 21, 23, 26, 29, 30, 39, 40, 54, 57, 68, 71, 74, 75, 88, 90, 93, 98, 99, 100, 102, 103, 104, 105, 106, 107, 108, 109, 112, 113, 114, 116, 117, 119, 120, 128, 130, 132, 133, 141], "lava": [2, 21, 55], "sutton": [2, 92, 93, 103, 104, 111, 112, 117, 139], "barton": 2, "gridworld": [2, 109, 112, 132], "true": [2, 7, 8, 12, 14, 15, 17, 18, 19, 21, 22, 23, 24, 50, 51, 52, 53, 54, 88, 89, 90, 98, 99, 100, 101, 107, 108, 111, 113, 119, 122, 124, 126, 127, 130, 132, 136, 139, 141], "condit": [2, 133, 139, 141], "outsid": [2, 7, 89, 90, 117, 133], "scope": [2, 133], "satisfi": 2, "typic": [2, 14, 114], "timelimit": [2, 8, 16, 18, 21, 126, 132, 133], "could": [2, 3, 14, 21, 24, 130, 132, 133, 134, 136, 139, 141], "also": [2, 7, 8, 11, 14, 15, 16, 18, 19, 21, 24, 36, 57, 58, 69, 70, 72, 88, 89, 90, 91, 97, 98, 99, 100, 101, 107, 108, 109, 118, 124, 127, 132, 133, 134, 136, 139, 141], "indic": [2, 7, 14, 18, 23, 89, 92, 93, 98, 101, 102, 111, 112, 113, 114, 122, 133, 139, 141], "physic": [2, 87, 97, 103, 104, 118, 130, 141], "go": [2, 48, 75, 79, 89, 111, 127, 133, 136, 139, 141], "out": [2, 4, 13, 16, 24, 33, 38, 55, 58, 66, 71, 76, 127, 130, 132, 133, 134, 141], "bound": [2, 7, 11, 16, 17, 21, 23, 90, 92, 93, 94, 95, 96, 122, 124, 125, 133], "prematur": 2, "auxiliari": [2, 132], "diagnost": 2, "log": [2, 136, 141], "might": [2, 9, 11, 12, 16, 17, 18, 20, 23, 132, 134, 136, 139, 141], "instanc": [2, 4, 7, 8, 9, 10, 12, 13, 14, 15, 18, 21, 109, 134, 136], "describ": [2, 9, 10, 21, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 92, 93, 107, 111, 118, 130, 134], "perform": [2, 3, 7, 9, 14, 18, 21, 22, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 106, 109, 117, 122, 130, 141], "variabl": [2, 7, 9, 11, 15, 18, 98, 100, 107, 108, 109, 120, 132, 133, 139, 141], "hidden": [2, 97, 141], "individu": [2, 3, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 124, 132, 134, 141], "term": [2, 91, 92, 97, 98, 99, 100, 101, 105, 106, 107, 108, 132, 134, 136], "combin": [2, 9, 14, 16, 21, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 55, 56, 57, 58, 59, 60, 61, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 106, 136], "produc": [2, 7, 16, 18, 102, 122, 132], "total": [2, 44, 88, 89, 90, 98, 99, 100, 101, 102, 103, 105, 106, 107, 108, 114, 136, 141], "In": [2, 3, 7, 11, 14, 15, 16, 17, 19, 21, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 89, 91, 92, 98, 99, 100, 101, 107, 108, 114, 124, 127, 130, 132, 133, 134, 136, 139, 141], "openai": [2, 8, 15, 16, 21, 23, 87, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 126, 127, 128, 129, 130, 133, 139, 141], "gym": [2, 7, 8, 9, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 23, 87, 88, 89, 90, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 126, 127, 128, 129, 132, 133, 134, 136, 139, 141], "v26": [2, 130, 141], "distinguish": [2, 132, 133], "howev": [2, 3, 7, 8, 9, 10, 11, 12, 15, 17, 18, 19, 21, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 92, 98, 99, 100, 101, 105, 106, 122, 130, 132, 133, 134, 136, 139], "deprec": [2, 117, 119, 120, 121, 124, 130], "favour": [2, 22, 23, 124, 126, 130], "boolean": [2, 7, 9, 14, 18, 23, 90, 139, 141], "valu": [2, 7, 8, 9, 10, 11, 12, 13, 14, 16, 17, 18, 19, 21, 23, 24, 74, 88, 90, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 112, 113, 114, 122, 124, 127, 133, 136, 139, 141], "case": [2, 4, 7, 9, 10, 11, 17, 19, 21, 23, 57, 69, 89, 98, 99, 100, 101, 107, 108, 114, 132, 133, 134, 136, 141], "further": [2, 23, 74, 90, 105, 106, 124, 141], "undefin": 2, "signal": [2, 7, 16, 18, 21, 98, 100, 101, 108, 114, 132, 133], "mai": [2, 7, 9, 11, 12, 14, 15, 16, 17, 18, 19, 21, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 98, 99, 100, 101, 107, 108, 113, 132, 136], "emit": [2, 16, 18], "differ": [2, 9, 10, 14, 15, 17, 18, 19, 21, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 89, 96, 98, 99, 100, 101, 102, 103, 104, 108, 109, 124, 128, 132, 133, 134, 136], "reason": [2, 7, 23, 90, 124], "mayb": 2, "underli": [2, 16, 18, 21, 92], "solv": [2, 88, 91, 93, 97, 103, 104, 132, 137, 140, 141], "successfulli": [2, 114], "certain": [2, 47, 49, 103, 104, 106, 124, 136, 139], "exceed": [2, 16, 18, 21, 98, 100, 101, 108, 139], "simul": [2, 24, 50, 51, 52, 53, 54, 97, 101, 102, 103, 104, 139, 141], "enter": [2, 14, 31, 33, 60, 90, 112], "invalid": [2, 11, 139], "int": [2, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 24, 111, 112, 113, 114, 130, 132, 136, 139, 141], "none": [2, 4, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 18, 19, 23, 113, 124, 130, 132, 136, 139], "option": [2, 4, 7, 8, 9, 10, 11, 14, 15, 16, 18, 19, 21, 23, 89, 92, 93, 94, 95, 96, 119, 122, 124, 132], "intern": [2, 4, 15, 19, 127], "new": [2, 3, 7, 9, 16, 17, 18, 19, 21, 22, 23, 28, 31, 33, 46, 92, 93, 94, 95, 96, 98, 106, 109, 114, 118, 119, 122, 123, 124, 125, 126, 127, 130, 132, 133, 134, 136, 139], "often": [2, 9, 97, 132], "some": [2, 9, 10, 11, 15, 16, 18, 21, 23, 24, 40, 48, 66, 89, 91, 92, 97, 106, 107, 114, 127, 132, 134, 136, 139], "explor": [2, 9, 54, 109, 130, 136, 139], "generalis": 2, "polici": [2, 7, 19, 20, 21, 23, 91, 97, 98, 99, 100, 101, 102, 107, 108, 109, 115, 118, 133, 136], "control": [2, 9, 11, 21, 23, 24, 26, 29, 31, 32, 33, 34, 35, 40, 42, 45, 52, 53, 54, 57, 59, 66, 67, 69, 71, 72, 73, 74, 75, 76, 79, 80, 87, 89, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 117, 119, 122, 124, 130, 134, 136], "alreadi": [2, 3, 16, 19, 21, 130], "rng": [2, 4, 9, 10, 11, 119, 132], "therefor": [2, 3, 7, 9, 15, 23, 122, 126, 127, 130], "right": [2, 11, 24, 26, 28, 29, 30, 31, 35, 39, 40, 44, 46, 47, 48, 49, 50, 51, 52, 53, 54, 56, 57, 58, 59, 61, 63, 64, 65, 67, 70, 75, 77, 78, 80, 81, 84, 85, 88, 89, 90, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 107, 108, 112, 113, 114, 132, 139, 141], "after": [2, 4, 7, 8, 14, 15, 18, 19, 21, 32, 36, 41, 47, 51, 55, 77, 90, 98, 99, 100, 101, 102, 107, 108, 111, 114, 124, 132, 133, 136, 139, 141], "never": 2, "again": [2, 90, 132], "custom": [2, 7, 9, 14, 15, 16, 19, 21, 23, 24, 50, 51, 52, 53, 54, 107, 109, 113, 116, 126, 135, 137], "line": [2, 9, 23, 47, 92, 114, 117, 132], "correctli": [2, 7, 19, 20, 121, 122, 126, 132], "v0": [2, 3, 8, 14, 16, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 89, 90, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 112, 113, 114, 132, 133, 141], "25": [2, 12, 24, 50, 51, 52, 53, 54, 98, 100, 101, 102, 108, 114, 127, 130], "return_info": [2, 119, 124, 127], "now": [2, 23, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 116, 117, 118, 119, 121, 122, 123, 124, 127, 129, 130, 132, 133, 139, 141], "expect": [2, 3, 9, 10, 11, 15, 18, 21, 117, 127, 130, 136, 141], "prng": [2, 9, 10, 11], "doe": [2, 7, 8, 10, 12, 14, 15, 18, 22, 36, 52, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 117, 130, 132, 133, 134, 136], "pass": [2, 4, 7, 8, 9, 10, 11, 12, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 89, 90, 98, 99, 100, 101, 107, 108, 119, 122, 132, 134, 136], "chosen": [2, 11, 24, 136], "sourc": [2, 97, 109, 119, 132, 133, 134, 136, 137, 139, 141], "entropi": [2, 136], "timestamp": 2, "dev": [2, 124, 127, 141], "urandom": 2, "integ": [2, 7, 10, 11, 12, 14, 18, 19, 23, 24, 119, 126, 130, 132], "even": [2, 8, 25, 27, 33, 34, 36, 38, 41, 42, 45, 55, 56, 57, 59, 60, 62, 66, 69, 71, 72, 73, 74, 76, 79, 83, 86, 102, 128, 132, 139], "exist": [2, 8, 9, 15, 16, 21, 130, 136], "usual": [2, 7, 10, 11, 18, 24, 50, 51, 52, 53, 54, 56, 100, 132, 134, 136, 139], "been": [2, 14, 18, 21, 23, 98, 101, 102, 109, 118, 119, 122, 124, 127, 128, 130, 132, 133], "refer": [2, 14, 18, 21, 23, 132, 133], "minim": [2, 132, 133, 136, 141], "abov": [2, 3, 10, 11, 14, 22, 23, 24, 50, 51, 52, 53, 54, 92, 93, 96, 97, 130, 136, 141], "paradigm": 2, "specifi": [2, 7, 9, 10, 11, 14, 16, 17, 18, 19, 20, 21, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 90, 91, 96, 100, 101, 105, 106, 108, 110, 113, 114, 124, 128, 129, 130, 132, 134], "how": [2, 9, 14, 15, 21, 56, 58, 59, 102, 103, 105, 106, 132, 133, 134, 136, 139, 141], "depend": [2, 7, 10, 14, 19, 20, 24, 26, 27, 28, 29, 30, 31, 32, 35, 36, 37, 39, 40, 42, 44, 46, 47, 48, 49, 50, 51, 52, 53, 54, 58, 59, 61, 63, 64, 65, 67, 68, 70, 75, 77, 78, 80, 81, 82, 84, 85, 87, 91, 93, 97, 98, 99, 100, 101, 107, 108, 109, 113, 116, 117, 121, 123, 126, 130, 136], "specif": [2, 7, 8, 11, 18, 126, 133, 136, 141], "analog": [2, 24], "dictionari": [2, 7, 9, 10, 14, 15, 16, 18, 19, 21, 23, 122, 126, 132, 134, 139, 141], "complement": 2, "It": [2, 7, 8, 10, 11, 14, 15, 18, 21, 24, 25, 26, 27, 28, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 55, 56, 57, 58, 59, 60, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 82, 83, 84, 85, 88, 97, 98, 99, 100, 101, 102, 105, 106, 107, 108, 109, 127, 130, 132, 139, 141], "renderfram": [2, 14], "list": [2, 3, 7, 8, 9, 10, 11, 14, 15, 16, 18, 19, 21, 24, 116, 118, 122, 124, 127, 130, 136, 139], "comput": [2, 14, 67, 79, 98, 103, 105, 106, 109, 126, 132, 136, 139], "frame": [2, 7, 14, 18, 19, 24, 37, 89, 90, 102, 105, 124, 127], "render_mod": [2, 7, 14, 15, 16, 18, 19, 21, 23, 24, 115, 124, 126, 127, 128, 129, 130, 132, 136], "wai": [2, 10, 16, 21, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 118, 133, 134, 136, 139], "most": [2, 7, 9, 16, 18, 19, 21, 23, 24, 50, 51, 52, 53, 54, 106, 119, 122, 132, 134, 139], "achiev": [2, 24, 27, 92, 111, 127, 136], "appli": [2, 7, 8, 10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 88, 90, 91, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 122, 127, 132, 134, 139, 141], "collect": [2, 3, 7, 15, 18, 27, 30, 48, 62, 63, 66, 82, 109, 136, 139], "As": [2, 3, 15, 16, 18, 21, 80, 92, 97, 98, 99, 101, 102, 110, 112, 114, 119, 124, 126, 129, 130, 134, 136, 141], "known": [2, 18, 31], "__init__": [2, 10, 13, 16, 17, 19, 20, 130, 132, 134, 136, 139, 141], "initialis": [2, 7, 18, 23, 111], "By": [2, 7, 8, 18, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 92, 98, 99, 100, 101, 107, 108], "continu": [2, 7, 9, 16, 17, 21, 29, 30, 89, 90, 91, 94, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 119, 122, 124, 133, 136, 139, 141], "current": [2, 3, 7, 11, 14, 16, 18, 19, 24, 89, 92, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 112, 113, 119, 124, 130, 132, 136, 139, 141], "displai": [2, 8, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 93, 121, 132], "consumpt": 2, "occur": [2, 7, 18, 92, 93, 132, 136], "repres": [2, 7, 10, 11, 14, 21, 23, 90, 92, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 112, 113, 114, 115, 119, 132, 141], "np": [2, 7, 8, 9, 10, 11, 13, 14, 15, 17, 19, 90, 114, 119, 130, 132, 134, 136, 139, 141], "ndarrai": [2, 4, 7, 8, 10, 11, 12, 13, 14, 17, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 114, 136, 141], "shape": [2, 7, 9, 10, 11, 12, 13, 16, 17, 18, 19, 21, 88, 89, 90, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 112, 113, 114, 117, 124, 130, 132, 134, 136, 141], "x": [2, 9, 12, 90, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 105, 106, 107, 108, 109, 112, 130, 132, 136, 141], "y": [2, 24, 90, 96, 98, 99, 101, 102, 103, 105, 106, 107, 114, 141], "3": [2, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 22, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 89, 90, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 112, 113, 114, 116, 119, 122, 126, 132, 136, 139, 141], "rgb": [2, 7, 16, 18, 19, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 89, 98, 99, 100, 101, 102, 103, 104, 107, 108, 125, 127], "pixel": [2, 7, 16, 19, 89, 109, 132], "imag": [2, 7, 9, 15, 16, 18, 19, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 89], "string": [2, 7, 8, 9, 11, 14, 19, 122], "stringio": 2, "style": [2, 15, 18, 109, 122, 124, 141], "represent": [2, 21, 133], "each": [2, 3, 7, 8, 9, 10, 11, 14, 15, 16, 17, 19, 21, 24, 44, 46, 47, 48, 49, 52, 60, 67, 69, 70, 71, 72, 73, 74, 75, 87, 88, 90, 91, 92, 93, 94, 95, 98, 101, 102, 103, 104, 105, 109, 110, 112, 114, 127, 132, 136, 139], "includ": [2, 7, 8, 19, 21, 22, 23, 24, 93, 98, 99, 100, 101, 103, 104, 105, 106, 107, 108, 109, 114, 117, 122, 130, 132, 133], "newlin": 2, "escap": [2, 43, 58, 62], "sequenc": [2, 7, 8, 9, 11, 12, 15, 19, 21, 24, 109, 127, 130], "color": [2, 10, 19, 28, 39, 52, 70, 114], "rgb_array_list": [2, 7, 14, 16, 18, 127], "ansi_list": 2, "base": [2, 3, 4, 7, 10, 15, 16, 18, 21, 48, 57, 74, 87, 92, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 114, 116, 127, 130, 132, 134, 136, 139, 141], "except": [2, 71, 74, 122, 128, 130, 132], "rendercollect": [2, 3, 7, 16, 18, 130], "pop": [2, 106, 124], "kei": [2, 7, 8, 9, 10, 11, 14, 15, 16, 18, 19, 21, 23, 24, 25, 56, 98, 99, 100, 101, 105, 106, 107, 108, 112, 113, 114, 123, 126, 132, 133, 134, 139], "support": [2, 3, 7, 9, 10, 12, 14, 15, 16, 18, 19, 21, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 92, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 119, 121, 122, 123, 124, 125, 127, 130, 132], "longer": [2, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 98, 100, 101, 102, 103, 104, 105, 106, 108, 109, 118, 119, 127, 141], "accept": [2, 7, 14, 18, 24, 118, 119, 130, 132], "rather": [2, 23, 89, 109, 136, 139], "v1": [2, 7, 8, 14, 15, 18, 19, 20, 21, 88, 89, 90, 92, 93, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 113, 114, 116, 117, 118, 122, 127, 139], "type": [2, 7, 9, 10, 11, 15, 16, 17, 19, 21, 23, 46, 89, 98, 99, 100, 101, 107, 108, 109, 119, 121, 124, 126, 127, 130, 132, 134, 141], "discret": [2, 7, 9, 10, 12, 13, 15, 19, 21, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 89, 90, 92, 93, 94, 95, 110, 111, 112, 113, 114, 122, 124, 130, 132, 134, 139], "give": [2, 27, 28, 46, 47, 90, 105, 111, 114, 118, 136, 139, 141], "2": [2, 7, 9, 10, 11, 12, 13, 14, 15, 17, 19, 20, 24, 25, 26, 28, 29, 30, 31, 32, 34, 35, 37, 39, 40, 42, 44, 46, 47, 48, 49, 50, 51, 52, 53, 54, 56, 58, 61, 63, 64, 65, 67, 68, 70, 75, 77, 78, 79, 80, 81, 82, 84, 85, 89, 90, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 111, 112, 113, 114, 122, 127, 132, 134, 136, 139, 141], "mean": [2, 7, 21, 23, 92, 98, 99, 100, 105, 127, 132, 136, 141], "two": [2, 7, 9, 10, 11, 14, 15, 18, 19, 23, 24, 26, 37, 79, 88, 90, 92, 94, 95, 97, 98, 99, 100, 101, 102, 103, 105, 106, 107, 108, 111, 117, 127, 132, 136, 139], "1": [2, 7, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 89, 90, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 112, 113, 114, 119, 122, 124, 126, 127, 132, 133, 134, 136, 139, 141], "box": [2, 7, 9, 10, 12, 13, 15, 16, 17, 19, 21, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 89, 90, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 117, 118, 123, 124, 130, 132, 134], "4028234663852886e": 2, "38": [2, 7, 101, 102], "4": [2, 7, 11, 12, 14, 15, 18, 19, 21, 24, 26, 28, 29, 30, 31, 33, 35, 37, 39, 40, 44, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 58, 61, 63, 64, 65, 67, 68, 69, 70, 77, 78, 80, 81, 82, 84, 85, 88, 89, 90, 92, 93, 94, 95, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 112, 113, 114, 127, 132, 134, 139, 141], "float32": [2, 7, 10, 11, 12, 13, 15, 16, 17, 19, 21, 88, 89, 90, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108], "denot": [2, 93], "well": [2, 9, 31, 74, 92, 98, 101, 102, 109, 126, 132, 136], "high": [2, 3, 10, 11, 12, 13, 15, 21, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 89, 90, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 124, 130, 134, 136], "8000002e": [2, 7], "00": [2, 7], "4028235e": [2, 7], "1887903e": [2, 7], "01": [2, 7, 20, 90, 98, 99, 102, 103, 104, 105, 106, 107, 130, 136, 139], "dtype": [2, 7, 9, 10, 11, 12, 13, 15, 19, 90, 117, 130, 132], "low": [2, 10, 11, 12, 13, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 89, 90, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 124, 134, 136], "etc": [2, 9, 69, 72, 76, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 117, 130, 132, 133, 134], "determin": [2, 11, 24, 90, 92, 93, 94, 95, 96, 109, 113, 127, 132, 133], "inf": [2, 7, 93, 95, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 134], "envspec": [2, 8, 16], "normal": [2, 7, 11, 16, 18, 19, 20, 88, 89, 96, 98, 99, 103, 127, 130, 136, 141], "finish": [2, 89, 90, 124, 136], "code": [2, 4, 7, 9, 10, 14, 15, 16, 18, 19, 20, 92, 109, 116, 119, 120, 124, 130, 132, 134, 136, 137, 139, 141], "clean": 2, "up": [2, 10, 11, 15, 19, 24, 25, 27, 28, 29, 30, 31, 33, 34, 35, 37, 40, 43, 44, 46, 47, 48, 49, 50, 51, 52, 53, 54, 57, 58, 61, 63, 68, 70, 71, 72, 74, 75, 78, 79, 80, 81, 84, 85, 88, 90, 97, 98, 101, 102, 106, 111, 112, 113, 114, 130, 132, 136, 139], "window": [2, 14, 44, 89, 121, 127, 130, 132], "http": [2, 14, 24, 89, 92, 111, 112, 113, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 126, 127, 128, 129, 130, 132, 136, 139, 141], "connect": [2, 10, 92, 98, 99, 100, 106, 107, 108], "properti": [2, 7, 9, 16, 117, 118, 123, 130, 133], "unwrap": [2, 16, 21, 92], "non": [2, 7, 9, 12, 14, 113, 122, 132, 133, 141], "wrap": [2, 7, 8, 14, 15, 16, 18, 19, 20, 21, 132, 134, 141], "_np_random": [2, 123], "meth": [2, 7], "much": [2, 24, 50, 51, 52, 53, 54, 58, 59, 102, 118, 127, 130, 132, 133], "creat": [2, 3, 7, 8, 11, 13, 14, 15, 18, 21, 34, 88, 89, 90, 105, 106, 130, 134, 136, 139, 141], "creation": [2, 15, 130, 132], "tutori": [2, 16, 21, 23, 130, 134, 136, 139, 141], "gymnasium": [3, 7, 8, 9, 10, 11, 12, 13, 14, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 111, 112, 113, 114, 130, 133, 136, 139, 141], "env": [3, 4, 7, 8, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 89, 90, 92, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 112, 113, 114, 115, 116, 117, 119, 120, 122, 123, 124, 127, 128, 129, 130, 133, 134, 135, 137, 139, 141], "flexibl": [3, 15, 109, 130], "implement": [3, 7, 9, 10, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 96, 103, 109, 110, 114, 124, 126, 130, 132, 135, 136, 137, 141], "complic": [3, 11, 16, 134], "parallel": [3, 15, 136], "propos": [3, 7, 109, 130], "funcenv": [3, 130], "part": [3, 18, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 89, 90, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 112, 113, 114, 119, 127, 130, 133], "its": [3, 7, 14, 15, 17, 18, 39, 46, 69, 81, 86, 90, 96, 97, 107, 109, 141], "own": [3, 15, 16, 23, 39, 74, 134, 135, 137], "relat": [3, 141], "larg": [3, 15, 23, 95, 98, 99, 100, 101, 102, 105, 106, 107, 108, 109, 116, 117, 119, 124, 130, 134], "believ": [3, 130], "improv": [3, 15, 117, 119, 122, 127, 130], "work": [3, 9, 14, 16, 18, 19, 24, 89, 90, 92, 99, 100, 103, 104, 108, 116, 118, 124, 130], "progress": [3, 10, 80, 130, 136], "arbitrarili": [3, 130], "complex": [3, 9, 10, 101, 102, 103, 104, 130, 136, 141], "rl": [3, 7, 14, 18, 115, 130, 133, 139, 141], "advanc": [3, 15, 92, 130], "becom": [3, 73, 87, 119, 124, 130, 133, 136], "were": [3, 19, 23, 41, 87, 92, 119, 122, 124, 128, 130, 132, 136], "mind": [3, 130], "jax": [3, 7, 109, 130], "With": [3, 112, 130, 136, 139], "hardwar": [3, 122, 130], "acceler": [3, 89, 94, 95, 96, 122, 130, 136], "brax": [3, 109, 130], "written": [3, 14, 16, 23, 130], "similar": [3, 10, 23, 28, 39, 105, 119, 130, 132], "pytorch": [3, 7, 130, 141], "program": [3, 15, 130], "onli": [3, 7, 8, 9, 10, 11, 12, 15, 16, 18, 19, 23, 24, 26, 28, 29, 30, 31, 32, 35, 37, 39, 40, 44, 46, 47, 48, 49, 50, 51, 52, 53, 54, 56, 58, 61, 63, 64, 65, 67, 68, 70, 71, 72, 73, 74, 75, 77, 78, 80, 81, 82, 84, 85, 94, 95, 98, 99, 100, 101, 103, 105, 106, 108, 109, 122, 124, 125, 126, 127, 128, 130, 132, 134, 136, 139], "game": [3, 7, 11, 14, 18, 21, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 63, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 87, 111, 112, 113, 117, 118, 130, 132, 139], "town": [3, 130], "anymor": [3, 7, 130], "upgrad": [3, 118, 127, 130], "jumpi": [3, 130], "project": [3, 21, 23, 109, 119, 124, 127, 130, 139], "develop": [3, 97, 124, 130, 141], "farama": [3, 14, 109, 130, 132, 136, 139, 141], "foundat": [3, 109, 130, 132], "compat": [3, 16, 19, 21, 109, 115, 119, 121, 122, 124, 125, 126, 130], "futur": [3, 4, 80, 109, 119, 122, 124, 130], "subset": [3, 11, 24, 50, 51, 52, 53, 54, 130, 132, 134], "like": [3, 4, 7, 9, 11, 14, 16, 17, 18, 19, 20, 21, 26, 27, 28, 29, 30, 31, 32, 33, 35, 37, 39, 40, 44, 46, 47, 48, 49, 58, 61, 63, 64, 65, 66, 67, 68, 69, 70, 75, 77, 78, 80, 81, 82, 84, 85, 88, 90, 98, 99, 101, 102, 104, 105, 106, 108, 114, 119, 124, 127, 130, 132, 134, 136], "supersuit": [3, 130], "aim": [3, 56, 100, 103, 107, 108, 124, 127, 130, 141], "bring": [3, 130], "mani": [3, 7, 11, 18, 19, 21, 24, 30, 33, 37, 56, 59, 74, 84, 117, 120, 130, 132, 139], "awar": [3, 23, 130], "plan": [3, 109, 119, 124, 127, 130], "miss": [3, 21, 75, 92, 114, 118, 130], "issu": [3, 18, 21, 23, 24, 98, 100, 101, 102, 108, 116, 118, 119, 121, 124, 130, 132], "detail": [3, 9, 14, 18, 21, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 92, 109, 122, 124, 127, 130, 132, 136], "caus": [3, 18, 21, 57, 114, 116, 125, 126, 129, 130], "ad": [3, 7, 16, 18, 19, 21, 23, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 52, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 90, 95, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 114, 116, 117, 118, 119, 122, 123, 124, 125, 127, 130, 132], "lambaactionv0": [3, 130], "don": [3, 10, 16, 23, 24, 40, 50, 51, 52, 53, 54, 74, 89, 94, 124, 130, 132, 133, 136], "regularli": [3, 130], "signific": [3, 22, 130], "affect": [3, 130], "addition": [3, 101, 102, 127, 130], "hope": [3, 130], "reproduc": [3, 10, 23, 130], "academia": [3, 130], "v28": [3, 130], "rewrit": [3, 123, 130], "vectorenv": [3, 9, 116, 122, 130], "inherit": [3, 9, 16, 17, 19, 20, 21, 117, 130, 132], "replac": [3, 16, 23, 111, 117, 119, 123, 124, 130, 139], "30": [3, 7, 14, 18, 24, 68, 71, 101, 102, 130], "old": [3, 7, 15, 16, 18, 22, 23, 115, 118, 119, 122, 125, 126, 127], "transformobserv": [3, 7, 16, 19], "lambdaobservationv0": [3, 7], "filterobserv": [3, 16, 19], "filterobservationv0": [3, 7], "flattenobserv": [3, 10, 16, 19, 132], "flattenobservationv0": [3, 7], "grayscaleobserv": [3, 16, 19], "grayscaleobservationv0": [3, 7], "resizeobserv": [3, 16, 19, 130], "resizeobservationv0": [3, 7], "reshape_v0": 3, "reshapeobservationv0": [3, 7], "Not": [3, 7, 18], "rescaleobservationv0": [3, 7], "dtype_v0": 3, "dtypeobservationv0": [3, 7], "pixelobservationwrapp": [3, 16, 19, 125, 128], "pixelobservationv0": [3, 7], "normalizeobserv": [3, 16, 19, 117], "normalizeobservationv0": [3, 7], "timeawareobserv": [3, 16, 19, 21], "timeawareobservationv0": [3, 7], "framestack": [3, 7, 16, 18, 19, 117, 125], "framestackobservationv0": [3, 7], "delay_observations_v0": 3, "delayobservationv0": [3, 7], "action_lambda_v1": 3, "lambdaactionv0": [3, 7], "clipact": [3, 16, 17, 21], "clipactionv0": [3, 7], "rescaleact": [3, 7, 16, 17, 21], "rescaleactionv0": [3, 7], "sticky_actions_v0": 3, "stickyactionv0": [3, 7], "transformreward": [3, 16, 20], "lambdarewardv0": [3, 7], "clip_reward_v0": 3, "cliprewardv0": [3, 7], "normalizereward": [3, 16, 20, 117], "normalizerewardv0": [3, 7], "autoresetwrapp": [3, 8, 16, 18, 122, 132], "autoresetv0": [3, 7], "passiveenvcheck": [3, 16, 18, 21, 130], "passiveenvcheckerv0": [3, 7], "orderenforc": [3, 7, 16, 18, 21, 122, 132], "orderenforcingv0": [3, 7], "envcompat": [3, 16, 18, 22, 23, 127], "shimmi": [3, 130], "recordepisodestatist": [3, 16, 18, 23, 117, 136, 139, 141], "recordepisodestatisticsv0": [3, 7], "ataripreprocess": [3, 16, 18], "ataripreprocessingv0": [3, 7], "recordvideo": [3, 16, 18, 23, 117, 124, 127], "recordvideov0": [3, 7, 130], "humanrend": [3, 7, 16, 18, 130], "humanrenderingv0": [3, 7], "rendercollectionv0": [3, 7], "jaxtonumpyv0": [3, 7], "jaxtotorchv0": [3, 7], "numpytotorchv0": [3, 7], "These": [3, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 97, 98, 101, 107, 122, 127, 130, 139, 141], "28": [3, 24, 33, 39, 92, 101, 102], "templat": 4, "meant": 4, "stateless": [4, 130], "manner": [4, 7, 11, 16, 19, 56, 117, 118], "being": [4, 7, 8, 12, 18, 45, 94, 95, 96, 98, 101, 102, 106, 119, 122, 124, 127, 139], "around": [4, 18, 34, 87, 106, 109, 121], "explicitli": [4, 132, 133], "That": [4, 93], "said": [4, 98, 100, 101, 108], "noth": [4, 89, 90, 141], "here": [4, 14, 92, 119, 127, 130, 132, 136], "prevent": [4, 11, 15, 47, 109, 117, 118], "statefulli": 4, "just": [4, 16, 21, 50, 56, 73, 104, 106, 127, 129, 130, 136], "recommend": [4, 7, 8, 15, 18, 23, 24, 50, 51, 52, 53, 54, 90, 98, 101, 102, 117, 124, 126, 132, 136, 139], "consist": [4, 7, 11, 19, 21, 24, 37, 88, 92, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 111, 117, 128, 132, 134, 139, 141], "method": [4, 7, 10, 14, 17, 18, 19, 20, 22, 117, 118, 119, 122, 123, 132, 134, 136, 141], "pomdp": 4, "given": [4, 7, 8, 11, 16, 19, 71, 74, 88, 90, 91, 92, 94, 95, 98, 100, 101, 108, 127, 133, 139], "transit": [4, 14, 21, 24, 50, 51, 52, 53, 54, 101, 102, 112, 113, 114, 133, 136], "next_stat": [4, 139], "state_info": 4, "step_info": 4, "structur": [4, 9, 10, 12, 130, 132], "serv": [4, 9, 98, 99, 100, 101, 107, 108, 141], "purpos": [4, 9, 119, 141], "allow": [4, 7, 8, 9, 10, 14, 16, 21, 22, 23, 24, 55, 73, 92, 93, 94, 95, 96, 103, 104, 105, 106, 109, 122, 124, 126, 127, 128, 130, 132, 134, 136, 141], "constant": [4, 35, 74, 90, 95, 98, 100, 101, 108], "them": [4, 7, 9, 16, 18, 22, 23, 24, 26, 27, 28, 31, 32, 36, 40, 47, 68, 77, 90, 98, 99, 106, 114, 124, 126, 134, 136], "itself": [4, 12, 15, 16, 18, 21, 22, 127, 136], "moment": [4, 74], "predominantli": 4, "intend": [4, 7, 18, 113], "flesh": 4, "offici": 4, "expos": 4, "statetyp": 4, "rewardtyp": 4, "terminaltyp": 4, "full": [4, 21, 24, 50, 51, 52, 53, 54, 89, 90, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 126, 127, 128, 129, 130, 139], "transform": [4, 7, 9, 12, 14, 16, 17, 18, 19, 20, 106, 134], "func": [4, 7], "callabl": [4, 7, 8, 13, 14, 15, 18, 19, 20, 130], "render_imag": 4, "render_st": 4, "renderstatetyp": 4, "show": [4, 19, 23, 24, 34, 40, 111, 122, 134, 136, 139, 141], "render_init": 4, "kwarg": [4, 8, 14, 15, 22, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 132], "render_clos": 4, "experiment": [7, 92, 130], "via": [7, 9, 10, 16, 18, 19, 20, 21, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 91, 97, 109, 110, 132, 141], "lambda": [7, 15, 19, 20, 136, 139], "ob": [7, 14, 17, 18, 19, 114, 119, 124, 127, 129, 130, 134, 139, 141], "42": [7, 10, 11, 13, 15, 17, 19, 93, 101, 102, 115, 130, 136], "06199517": 7, "0511615": 7, "04432538": 7, "02694618": 7, "constructor": [7, 8, 9, 10, 11, 14, 16, 17, 19, 20, 21, 127, 132], "assum": [7, 11, 19, 132], "same": [7, 10, 12, 14, 15, 19, 56, 88, 89, 92, 105, 106, 107, 114, 122, 127, 133, 136, 139], "filter_kei": [7, 19], "filter": [7, 16, 19], "0273956": [7, 15, 19], "00611216": [7, 15, 19], "03585979": [7, 15, 19], "0197368": [7, 15, 19], "fals": [7, 8, 14, 15, 18, 19, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 89, 90, 98, 99, 100, 101, 107, 108, 111, 119, 122, 124, 132, 136, 139, 141], "flatten": [7, 9, 12, 16, 19, 97, 117, 126, 130, 132, 136, 139], "carrac": [7, 8, 14, 19, 89, 122, 124, 126, 128], "v2": [7, 8, 14, 18, 19, 21, 23, 88, 89, 90, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 114, 115, 124, 130, 134, 136], "96": [7, 19, 24, 89], "27648": [7, 19], "_": [7, 13, 14, 15, 17, 18, 19, 20, 21, 115, 134, 136], "util": [7, 21, 22, 117, 124, 132, 136], "flatten_spac": [7, 9, 12], "keep_dim": [7, 19], "grayscal": [7, 18, 19, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86], "keep": [7, 14, 16, 18, 32, 45, 64, 67, 75, 76, 84, 93, 102, 132], "channel": [7, 18], "dimens": [7, 9, 11, 12, 19, 98, 99, 100, 101, 107, 108, 109, 141], "grayscale_env": 7, "resiz": [7, 16, 18, 19, 130], "opencv": [7, 18, 124], "resized_env": 7, "32": [7, 24, 39, 56, 101, 102, 111, 136, 141], "reshap": 7, "reshape_env": 7, "24": [7, 24, 33, 39, 64, 88, 89, 90, 93, 98, 101, 102, 124, 130, 139], "product": [7, 10, 11], "equal": [7, 94, 95, 103, 111, 113], "min_ob": 7, "float": [7, 8, 11, 12, 14, 16, 17, 19, 20, 24, 55, 68, 90, 98, 99, 100, 101, 107, 108, 132, 136, 139, 141], "max_ob": 7, "linearli": [7, 92, 103, 104, 141], "rescal": [7, 16, 17, 21], "between": [7, 10, 11, 18, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 90, 92, 93, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 124, 132, 133, 136, 139, 141], "pendulum": [7, 8, 15, 19, 21, 91, 92, 93, 97, 117, 118, 128, 141], "8": [7, 14, 15, 19, 20, 22, 24, 26, 28, 30, 31, 33, 35, 39, 44, 46, 47, 48, 49, 50, 51, 52, 53, 54, 58, 61, 63, 64, 80, 84, 85, 89, 90, 92, 93, 96, 98, 99, 100, 101, 102, 103, 105, 106, 107, 108, 113, 127, 136, 141], "10": [7, 10, 11, 24, 31, 37, 50, 51, 52, 53, 54, 61, 68, 71, 74, 88, 90, 96, 98, 99, 100, 101, 102, 103, 105, 106, 107, 108, 111, 112, 114, 119, 130, 132, 136, 139, 141], "multidiscret": [7, 9, 10, 12, 13, 15, 21, 116, 117, 124, 130, 132], "multibinari": [7, 9, 10, 12, 13, 21], "pixels_onli": [7, 19], "pixels_kei": 7, "obs_kei": 7, "augment": [7, 16, 19], "choos": [7, 19, 132], "origin": [7, 12, 15, 17, 18, 19, 23, 89, 92, 103, 105, 106, 122], "discard": [7, 19], "both": [7, 11, 15, 18, 19, 21, 22, 88, 91, 92, 106, 108, 109, 111, 112, 113, 114, 125, 126, 132, 133, 141], "epsilon": [7, 19, 20, 139], "1e": [7, 19, 20, 101, 107, 108, 141], "coordin": [7, 11, 16, 19, 88, 90, 96, 98, 99, 100, 101, 102, 103, 105, 106, 107, 108], "center": [7, 16, 19, 89, 90, 93, 96, 98, 99, 101, 102], "unit": [7, 9, 16, 19, 58, 92, 94, 95, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108], "varianc": [7, 16, 19, 20, 136], "past": [7, 19, 20, 124], "trajectori": [7, 16, 19, 20, 90, 101, 102], "newli": [7, 19, 20], "instanti": [7, 10, 14, 18, 19, 20, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 132], "recent": [7, 18, 19, 20, 22], "stabil": [7, 19, 20, 101, 102, 127, 134, 141], "scale": [7, 16, 18, 19, 20, 24, 90, 98, 99, 100, 101, 107, 108, 109, 136], "normalize_tim": 7, "dict_time_kei": 7, "remain": [7, 55, 58, 59, 74, 112, 116, 117, 132, 133], "final": [7, 14, 15, 18, 57, 124, 129, 130, 132, 133, 139], "sampl": [7, 9, 10, 11, 12, 13, 14, 15, 19, 20, 21, 23, 90, 114, 115, 124, 127, 130, 132, 136, 139, 141], "02727336": [7, 15, 19], "20172954": [7, 19], "03625453": [7, 15, 19], "32351476": [7, 19], "002": [7, 100, 108], "0000000e": 7, "5": [7, 10, 11, 12, 13, 17, 24, 26, 28, 29, 30, 31, 34, 35, 37, 40, 44, 46, 47, 48, 49, 50, 51, 52, 53, 54, 58, 61, 63, 64, 65, 67, 68, 70, 77, 78, 80, 81, 82, 84, 85, 88, 89, 90, 92, 94, 98, 99, 100, 101, 102, 103, 105, 106, 107, 108, 111, 114, 122, 127, 132, 136, 139, 141], "stack_siz": 7, "stack": [7, 16, 19, 130], "roll": [7, 16, 19, 37, 105, 139], "process": [7, 13, 14, 15, 19, 21, 92, 105, 132, 133, 136], "buffer": [7, 18, 19, 89], "fill": [7, 19, 33, 132], "num_stack": [7, 19], "ident": [7, 11, 15, 19, 130], "255": [7, 18, 19, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 89, 130, 132], "uint8": [7, 19, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86], "delai": [7, 132], "delayobserv": 7, "zero": [7, 11, 13, 96, 99, 109, 132, 133, 136, 139, 141], "noop_max": [7, 18], "frame_skip": [7, 18, 98, 99, 100, 101, 107, 108], "screen_siz": [7, 18], "84": [7, 18, 98, 101, 102], "terminal_on_life_loss": [7, 18], "grayscale_ob": [7, 18], "grayscale_newaxi": [7, 18], "scale_ob": [7, 18], "atari": [7, 16, 18, 21, 22, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 116, 117, 118, 119, 127, 129, 130, 139], "2600": [7, 18, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86], "preprocess": [7, 14, 16, 18, 129, 130], "guidelin": [7, 18], "machado": [7, 18, 24], "et": [7, 18, 24], "al": [7, 18, 22, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 116, 117, 118, 122, 127, 130, 139], "2018": [7, 18, 24, 92], "revisit": [7, 18, 24], "arcad": [7, 18, 24, 31, 48, 50, 51, 52, 53, 54, 109], "evalu": [7, 18, 24, 139], "protocol": [7, 18, 24], "open": [7, 18, 24, 37, 97, 109, 127, 130, 132], "problem": [7, 18, 24, 90, 93, 96, 103, 104, 107, 109, 111, 114, 115, 133, 136], "stage": [7, 18, 130], "noop": [7, 11, 14, 18, 24, 26, 28, 29, 30, 31, 32, 35, 37, 39, 40, 44, 46, 47, 48, 49, 50, 51, 52, 53, 54, 58, 61, 63, 64, 65, 67, 68, 70, 75, 77, 78, 80, 81, 82, 84, 85, 114, 136], "obtain": [7, 16, 18, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 96, 111, 133, 141], "op": [7, 18], "max": [7, 11, 17, 18, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 113, 136, 139, 141], "skip": [7, 14, 18, 24, 125, 132], "pool": [7, 18, 107], "life": [7, 18, 30, 44, 48, 72, 76, 119, 141], "lost": [7, 18, 33, 41, 60, 73, 77], "loss": [7, 18, 111, 136, 141], "turn": [7, 15, 18, 23, 27, 28, 89, 90, 103, 109, 122, 124, 127], "off": [7, 18, 23, 41, 56, 64, 72, 89, 90, 112, 114, 122, 127], "squar": [7, 18, 19, 73, 105, 106, 114, 132, 136], "210x180": [7, 18], "84x84": [7, 18], "colour": [7, 18, 89, 128], "greyscal": [7, 18], "No": [7, 18, 92, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 127, 141], "taken": [7, 15, 18, 48, 54, 91, 93, 132, 136, 141], "effect": [7, 12, 13, 16, 18, 19, 21, 24, 50, 51, 52, 53, 54, 90, 103, 104, 114, 139, 141], "frequenc": [7, 18], "experi": [7, 18, 98, 101, 102, 103, 104, 136, 139, 141], "whenev": [7, 18, 23, 30, 33, 132], "grai": [7, 16, 18, 19], "axi": [7, 18, 94, 95, 99, 101, 102, 107, 139], "dimension": [7, 9, 18, 19, 21, 28, 90, 98, 99, 100, 106, 107, 108, 130, 132, 136], "limit": [7, 8, 18, 21, 23, 40, 48, 55, 56, 69, 74, 103, 104, 130, 135, 136, 137, 139, 141], "memori": [7, 18, 19, 94, 95, 126], "optim": [7, 18, 24, 88, 90, 101, 102, 109, 136, 139, 141], "benefit": [7, 18], "rais": [7, 8, 11, 12, 13, 14, 15, 18, 19, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 125, 128, 130], "dependencynotinstal": [7, 14, 18], "valueerror": [7, 11, 12, 13, 15, 18, 19], "disabl": [7, 8, 18, 113, 122, 123, 124], "wrapperacttyp": [7, 16, 17], "lambdaact": 7, "clip": [7, 16, 17, 21, 94, 95, 98, 101, 132, 134, 136], "hopper": [7, 8, 16, 17, 97, 108], "v4": [7, 8, 16, 17, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 122, 123, 130, 141], "disable_env_check": [7, 8, 15, 122], "min_act": [7, 16, 17, 21], "max_act": [7, 16, 17, 21], "affin": [7, 17, 90], "must": [7, 9, 10, 12, 13, 14, 15, 16, 17, 18, 19, 21, 23, 24, 25, 26, 29, 31, 32, 33, 34, 36, 40, 41, 42, 45, 48, 49, 58, 62, 64, 65, 70, 89, 100, 108, 126, 132, 133], "match": [7, 12, 15, 17, 79], "75": [7, 17, 98], "wrapped_env": [7, 16, 17, 18, 21, 132, 134, 141], "wrapped_env_ob": [7, 17], "alltru": [7, 17], "min": [7, 11, 17, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111], "scalar": [7, 11, 17, 124], "repeat_action_prob": [7, 24, 50, 51, 52, 53, 54], "probabl": [7, 9, 24, 112, 113, 114, 133, 136, 139, 141], "repeat": [7, 24, 105], "previou": [7, 18, 23, 98, 101, 102, 133, 134], "section": [7, 23, 24, 75, 98, 99, 100, 101, 107, 108, 132, 139], "page": [7, 16, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 89, 90, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 112, 113, 114, 130], "12": [7, 12, 24, 31, 33, 37, 39, 50, 51, 52, 53, 54, 58, 61, 73, 90, 92, 93, 98, 99, 100, 101, 102, 105, 108, 111, 112, 130, 136, 139], "stickyact": 7, "rew": [7, 14, 133], "min_reward": [7, 134], "max_reward": [7, 134], "upper": [7, 11, 21, 101, 102, 122], "lower": [7, 11, 21, 98, 99, 100, 101, 102, 105, 106, 107, 108, 122, 126, 136, 139], "cliprewardsv0": 7, "union": [7, 10, 11, 12, 13, 14, 15, 17], "higher": [7, 88, 136], "gamma": [7, 20, 133, 136, 141], "99": [7, 20, 136, 141], "immedi": [7, 14, 16, 20, 111, 132], "exponenti": [7, 11, 16, 20], "averag": [7, 16, 20, 101, 133, 139, 141], "fix": [7, 9, 10, 11, 16, 18, 20, 21, 23, 57, 92, 93, 96, 97, 98, 99, 100, 101, 103, 104, 108, 111, 113, 118, 119, 120, 121, 122, 127, 130, 132, 141], "_update_running_mean": 7, "freez": 7, "calcul": [7, 96, 97, 98, 101, 102, 103, 105, 106, 112, 113, 114, 136], "statist": [7, 14, 18, 141], "runningmeanstd": 7, "get": [7, 16, 21, 24, 44, 47, 48, 49, 56, 66, 67, 68, 69, 71, 72, 73, 78, 88, 90, 98, 100, 101, 103, 111, 124, 130, 133, 136, 139], "discount": [7, 20, 133, 136, 139, 141], "factor": [7, 20, 136, 139, 141], "passiv": [7, 18, 125], "checker": [7, 8, 15, 18, 123, 125, 130], "surround": [7, 18], "thei": [7, 9, 15, 18, 19, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 106, 110, 111, 112, 113, 132, 136], "test": [7, 18, 88, 109, 116, 118, 122, 123, 125, 130, 132, 141], "disable_render_order_enforc": [7, 18, 122], "error": [7, 8, 11, 12, 14, 16, 18, 118, 119, 121, 122, 130, 133, 136, 139], "resetneed": [7, 18], "cannot": [7, 12, 13, 18, 21, 23, 112, 126, 132, 133], "order": [7, 8, 9, 10, 16, 18, 21, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 97, 98, 99, 100, 101, 102, 103, 104, 105, 108, 109, 122, 126, 130, 132], "enforc": [7, 8, 18, 118, 122], "buffer_length": 7, "100": [7, 10, 12, 18, 38, 48, 71, 72, 88, 89, 90, 92, 95, 100, 105, 112, 113], "stats_kei": 7, "track": [7, 14, 16, 18, 76, 89, 93, 98, 99, 100, 101, 102, 103, 104, 107, 108], "cumul": [7, 14, 16, 18], "length": [7, 8, 10, 11, 14, 16, 18, 19, 88, 92, 93, 94, 95, 99, 107, 109, 113, 114, 124, 136, 139], "At": [7, 18, 21, 33, 44, 47, 58], "vector": [7, 11, 14, 16, 18, 88, 90, 102, 103, 104, 105, 106, 119, 122, 127, 129, 130, 135, 137, 141], "_episod": [7, 18], "respect": [7, 11, 15, 16, 18, 21, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 90, 92, 98, 101, 102, 107, 119, 134, 136], "look": [7, 9, 14, 16, 18, 21, 24, 26, 28, 29, 30, 31, 32, 35, 37, 39, 40, 44, 46, 47, 48, 49, 58, 61, 63, 64, 65, 67, 68, 70, 73, 75, 77, 78, 80, 81, 82, 84, 85, 132, 133, 134, 136], "l": [7, 18, 107], "elaps": [7, 18], "sinc": [7, 18, 22, 24, 50, 51, 52, 53, 54, 87, 93, 97, 106, 109, 114, 116, 124, 132, 133], "begin": [7, 18, 23, 30, 33, 46, 71, 72, 73, 74, 127, 132, 136, 139], "form": [7, 9, 10, 11, 18, 92, 107, 130, 132], "final_observ": [7, 15, 18, 129, 130], "num": [7, 18, 24, 26, 28, 29, 30, 31, 32, 35, 37, 39, 40, 44, 46, 47, 48, 49, 50, 51, 52, 53, 54, 58, 61, 63, 64, 65, 67, 68, 70, 75, 77, 78, 80, 81, 82, 84, 85, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108], "_final_observ": [7, 18], "final_info": [7, 15, 18, 129, 130], "_final_info": [7, 18], "moreov": [7, 9, 16, 18, 24, 27, 37, 132, 134], "store": [7, 14, 15, 18, 141], "access": [7, 16, 18, 23, 55, 123, 130, 134], "return_queu": [7, 18, 136, 139, 141], "length_queu": [7, 18, 139], "episode_reward_buff": 7, "last": [7, 14, 18, 46, 47, 57, 99, 102, 105, 106, 118, 124, 127, 132, 133], "deque_s": [7, 18, 136, 139], "episode_length_buff": 7, "size": [7, 9, 18, 113, 128, 132], "video_fold": [7, 14, 18], "episode_trigg": [7, 14, 18], "step_trigg": [7, 14, 18], "video_length": [7, 14, 18], "name_prefix": [7, 14, 18], "disable_logg": [7, 18], "record": [7, 14, 16, 18, 88, 116, 117, 127, 136, 141], "rollout": [7, 16, 18, 114], "intermitt": [7, 18], "sai": [7, 18, 127, 134], "hundredth": [7, 18], "do": [7, 16, 18, 19, 24, 37, 49, 70, 74, 75, 89, 90, 92, 98, 99, 100, 101, 107, 108, 127, 130, 132, 134, 136, 141], "neither": [7, 11, 18, 111], "nor": [7, 11, 18, 111, 112], "emploi": [7, 18], "capped_cubic_video_schedul": [7, 14], "power": [7, 27, 55, 89, 90, 95, 103, 104, 141], "until": [7, 15, 16, 47, 60, 105, 111, 112, 113, 119, 132, 136, 141], "1000": [7, 14, 18, 21, 72, 74, 89, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 115, 136, 141], "stop": [7, 18, 21, 68, 78, 86, 111, 133, 139], "possibli": [7, 9, 10, 11, 13, 16, 18, 21, 109, 136], "span": [7, 18], "sever": [7, 8, 11, 18, 21, 23, 24, 54, 109, 125, 127, 130], "strictli": [7, 18], "per": [7, 11, 15, 37, 56, 79, 114, 119, 133, 136], "iff": [7, 14, 18, 132], "entir": [7, 14, 18, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 100, 108, 109, 118, 130, 136], "snippet": [7, 14, 18], "captur": [7, 14, 18, 83], "Will": [7, 14, 18], "prepend": [7, 14, 18], "filenam": [7, 14, 18], "moviepi": [7, 14, 18, 124, 127], "logger": [7, 18], "particularli": [7, 14, 18, 93], "haven": [7, 18], "screen": [7, 18, 24, 26, 30, 34, 39, 40, 42, 51, 57, 63, 73, 74, 98, 99, 100, 101, 102, 103, 104, 107, 108, 122], "rememb": [7, 15, 18, 89, 132, 134], "render_fp": [7, 14, 18, 132], "either": [7, 10, 11, 12, 14, 18, 19, 21, 22, 24, 47, 57, 94, 95, 98, 111, 113, 136, 141], "lunarland": [7, 8, 18, 21, 23, 90, 115, 130, 136], "simpli": [7, 17, 18, 19, 20, 24, 132], "nativ": [7, 18], "cartpolejax": [7, 18], "warn": [7, 10, 14, 15, 18, 116, 118, 121, 123, 125, 129, 130], "alwai": [7, 11, 12, 18, 24, 90, 94, 95, 98, 101, 102, 105, 107, 111, 112, 113, 114, 130, 132], "empti": [7, 11, 13, 18, 74, 139, 141], "pop_fram": [7, 18], "reset_clean": [7, 18], "renderedfram": 7, "clear": [7, 18, 78], "interact": [7, 9, 14, 24, 109, 132, 136, 139], "guarante": [7, 10, 24], "roundtrip": 7, "vice": [7, 13, 18], "versa": [7, 13, 18], "int_32": 7, "devicearrai": 7, "jnp": 7, "int23": 7, "input": [7, 14, 15, 19, 21, 136, 139], "devic": [7, 136], "tensor": [7, 136, 141], "torch": [7, 136, 141], "load": [8, 118], "pre": [8, 113, 130], "id": [8, 15, 113, 132], "liter": 8, "mountaincar": [8, 94], "mountaincarcontinu": [8, 95], "acrobot": [8, 91, 117], "lunarlandercontinu": [8, 134], "bipedalwalk": [8, 21, 88, 125, 128], "v3": [8, 21, 88, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 114, 122], "bipedalwalkerhardcor": 8, "blackjack": [8, 21, 110, 117, 119, 124, 130, 137, 140], "frozenlak": [8, 14, 113, 116, 130], "frozenlake8x8": [8, 116], "cliffwalk": [8, 112, 125], "taxi": [8, 110, 124], "reacher": [8, 97, 105, 130, 134], "pusher": [8, 97, 130], "invertedpendulum": [8, 97, 103, 104, 141], "inverteddoublependulum": [8, 103], "halfcheetah": [8, 97, 99], "swimmer": [8, 97, 125, 127], "walker2d": [8, 97], "ant": [8, 97, 100, 108, 122, 130], "humanoidstandup": [8, 97, 102], "humanoid": [8, 45, 97, 98, 130], "accord": [8, 10, 11, 15, 90, 136], "find": [8, 24, 25, 50, 51, 52, 53, 54, 60, 69, 81, 103, 106, 130, 132], "avail": [8, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 90, 109, 111, 112, 122, 130, 132], "modul": [8, 9, 13, 16, 122, 128, 132, 134, 136, 141], "eg": [8, 14, 132], "max_episode_step": [8, 18, 132, 136], "autoreset": [8, 15, 132], "apply_api_compat": [8, 22, 127], "stepapicompat": [8, 16, 18, 22, 130], "argument": [8, 9, 10, 11, 12, 14, 15, 19, 21, 22, 87, 91, 110, 116, 119, 123, 127, 132, 139], "addit": [8, 9, 15, 18, 21, 23, 24, 30, 41, 71, 75, 90, 91, 92, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 111, 114, 119, 124, 127, 130, 132, 136, 139, 141], "entry_point": [8, 127, 132], "reward_threshold": [8, 98, 99, 100, 101, 102, 105, 106, 107, 108, 132], "nondeterminist": [8, 132], "order_enforc": [8, 132], "syntax": 8, "namespac": [8, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 132], "env_nam": [8, 22], "v": [8, 73, 94, 103, 136], "keyword": [8, 10, 15, 19, 21, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 111, 124, 132, 139], "entri": [8, 23, 118], "point": [8, 12, 14, 16, 24, 27, 28, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 45, 46, 47, 48, 49, 51, 55, 56, 59, 66, 67, 68, 69, 70, 71, 72, 74, 76, 77, 78, 80, 81, 84, 88, 89, 90, 92, 93, 96, 106, 111, 118, 124, 133], "threshold": [8, 92, 93, 114, 132], "consid": [8, 89, 90, 91, 97, 98, 100, 101, 108, 132, 134], "learnt": 8, "knowledg": 8, "enabl": [8, 16, 24, 89, 109, 118, 122, 124], "correct": [8, 114, 128, 130, 132, 133], "pprint_registri": [8, 130], "env_id": [8, 22, 130], "retriev": [8, 18, 45, 48, 74], "global": 8, "_registri": 8, "num_col": 8, "exclude_namespac": 8, "disable_print": 8, "column": [8, 141], "arrang": 8, "exclud": [8, 98, 99, 100, 101, 107, 108], "instead": [8, 15, 19, 21, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 92, 108, 119, 122, 127, 132, 136], "consol": [8, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86], "variou": [9, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 102, 109, 118, 141], "mathemat": [9, 141], "environ": [9, 11, 13, 16, 17, 18, 19, 20, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 110, 111, 112, 113, 114, 117, 118, 122, 123, 124, 125, 126, 127, 129, 130, 133, 134, 135, 137, 141], "three": [9, 16, 19, 24, 27, 30, 32, 45, 53, 59, 66, 71, 72, 73, 74, 98, 100, 101, 102, 107, 108, 119, 132], "cube": [9, 70], "superclass": [9, 17, 19, 20], "npt": [9, 10, 11], "dtypelik": 9, "crucial": 9, "clearli": 9, "u": [9, 24, 127, 132, 134, 139, 141], "highli": [9, 23, 24, 87, 91, 109, 124, 132], "data": [9, 12, 14, 16, 23, 123, 124, 130, 132, 134, 136, 139, 141], "painlessli": 9, "flat": [9, 10, 11, 12, 19], "especi": [9, 132, 134, 136], "hierarch": [9, 114], "build": [9, 26, 44, 48, 103, 108, 130, 134], "express": [9, 14, 98, 101, 102], "cover": [9, 139], "parametr": [9, 141], "distribut": [9, 10, 11, 107, 109, 113, 118, 136, 141], "batch": [9, 13, 15, 119, 122, 136], "handl": [9, 15, 103, 111, 117, 121, 135, 137, 139], "care": [9, 75], "immut": 9, "is_np_flatten": [9, 130], "mask": [9, 10, 11, 23, 114, 124, 127, 136], "t_cov": 9, "randomli": [9, 10, 90, 113, 124, 132, 136], "uniform": [9, 11, 12, 94, 95, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108], "bounded": 9, "int8": [9, 11], "member": [9, 58], "subspac": [9, 10, 11, 12, 126], "to_json": 9, "sample_n": 9, "jsonabl": 9, "from_json": 9, "matric": [9, 109], "binari": [9, 11, 21, 132], "hold": [9, 111, 139], "down": [9, 11, 24, 28, 30, 31, 37, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 57, 58, 61, 63, 65, 66, 68, 70, 78, 80, 81, 84, 85, 89, 102, 111, 112, 113, 114, 132, 133, 139], "button": [9, 11, 14, 21], "multipl": [9, 10, 11, 13, 15, 122, 136], "ax": [9, 11, 132, 136, 139], "messag": [9, 118, 119, 124, 130], "mission": [9, 57, 59, 60], "join": [9, 130], "togeth": [9, 24, 97], "vectoris": [9, 109], "separ": [9, 10, 23, 130, 132, 136], "readabl": [9, 10, 130], "unord": 9, "entiti": 9, "select": [9, 11, 47, 98, 101, 102, 105, 106, 130, 136], "graph": [9, 12, 21, 124, 127, 136, 139], "node": [9, 10, 12, 124], "edg": [9, 10, 12, 93, 124], "unflatten": [9, 12, 130], "neural": [9, 12, 92, 107, 109, 136, 141], "network": [9, 12, 107, 136], "flatdim": [9, 12, 117], "revers": [9, 12, 111, 136, 141], "batch_spac": [9, 13], "concaten": [9, 12, 13, 97], "iter": [9, 10, 13, 15], "create_empty_arrai": [9, 13], "create_shared_memori": [9, 13], "read_from_shared_memori": [9, 13], "write_to_shared_memori": [9, 13], "spaces_kwarg": 10, "constitu": 10, "usag": [10, 11, 12, 89, 134], "ordereddict": [10, 13, 19], "nest": [10, 13, 109], "ext_control": 10, "inner_st": 10, "charg": 10, "system_check": 10, "job_statu": 10, "conveni": [10, 16, 21, 132], "easili": [10, 16, 127], "deal": [10, 136], "avoid": [10, 13, 16, 21, 24, 27, 28, 30, 35, 36, 44, 46, 62, 63, 65, 70, 72, 73, 78, 112, 114], "independ": [10, 11, 15, 100, 106, 107, 108], "attr": 10, "uniqu": [10, 87, 91, 97, 103, 126], "sub": [10, 15, 74], "precis": [10, 116], "cartesian": [10, 11, 96], "3991573": 10, "21649833": 10, "involv": [10, 87, 103, 104, 109, 112, 113, 114, 124, 130, 132, 141], "draw": [10, 111, 132, 139], "54": 10, "finit": [10, 11, 98, 102, 103, 104, 105, 106, 108, 133, 134, 141], "a_0": 10, "dot": [10, 11, 132], "a_n": 10, "a_i": 10, "belong": [10, 13], "n": [10, 11, 12, 13, 21, 24, 43, 89, 92, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 136, 139, 141], "6369617": 10, "01652764": 10, "8132702": 10, "length_mask": 10, "sample_mask": 10, "drawn": [10, 11, 105, 107, 111], "geometr": 10, "featur": [10, 11, 109, 122, 130, 136], "feature_spac": 10, "node_spac": [10, 12], "edge_spac": [10, 12], "seri": [10, 21], "adjac": 10, "matrix": 10, "edge_link": [10, 12], "num_nod": 10, "num_edg": 10, "graphinst": [10, 12, 129, 130], "edge_mask": 10, "multipli": [10, 95, 136], "attribut": [10, 21, 23, 105, 106, 132, 134], "unbound": 11, "mathbb": 11, "interv": [11, 21, 98, 100, 101, 108], "There": [11, 16, 21, 56, 57, 69, 88, 90, 91, 94, 95, 97, 102, 103, 104, 105, 106, 109, 112, 114, 116, 130, 132], "common": [11, 16, 21, 130, 133, 134, 141], "construct": [11, 24, 50, 51, 52, 53, 54, 92, 98, 99, 100, 101, 107, 108], "across": [11, 13, 30, 40, 51, 52, 55], "infer": [11, 97, 124], "essenti": 11, "shift": [11, 21], "unsupport": 11, "is_bound": 11, "sens": [11, 109], "One": [11, 21, 98, 101, 102], "smallest": 11, "maskndarrai": 11, "uniformli": [11, 24, 92, 93, 105, 106, 132], "infeas": 11, "sort": 11, "fair": 11, "coin": 11, "toss": 11, "nvec": 11, "int64": [11, 12, 130], "keyboard": [11, 14, 122], "nintendo": 11, "conceptu": 11, "arrow": [11, 68], "left": [11, 24, 26, 28, 29, 30, 31, 35, 39, 40, 44, 46, 47, 48, 49, 50, 51, 52, 53, 54, 56, 57, 58, 61, 63, 64, 65, 67, 70, 74, 75, 77, 78, 80, 81, 84, 85, 88, 89, 90, 93, 94, 98, 101, 102, 103, 104, 108, 112, 113, 114, 132, 139, 141], "param": 11, "press": [11, 14, 21, 89, 92], "although": 11, "rare": [11, 126], "d": [11, 14, 16, 92, 105, 106, 136], "categor": [11, 136], "count": [11, 88, 90, 111, 139], "kind": 11, "unless": [11, 16, 111, 112, 113, 114, 127, 132], "max_length": 11, "min_length": 11, "charset": 11, "alphanumer": 11, "compris": 11, "charact": [11, 14, 58, 69], "b5": 11, "hello": 11, "0123456789abcdefghijklmnopqrstuvwxyzabcdefghijklmnopqrstuvwxyz": 11, "0123456789": 11, "digit": [11, 109], "inclus": [11, 24, 118], "english": 11, "alphabet": 11, "plu": [11, 40, 112], "latin": 11, "charlist": 11, "matter": [11, 126], "attempt": [12, 90, 102, 103, 114], "compound": 12, "equival": [12, 23, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 124, 136], "oper": [12, 18, 123], "boundari": 12, "while": [12, 23, 24, 27, 28, 44, 59, 62, 63, 64, 65, 68, 70, 72, 74, 78, 81, 83, 90, 92, 93, 96, 98, 99, 101, 102, 105, 106, 107, 111, 112, 127, 132, 133, 136, 139, 141], "exactli": [12, 107], "necessarili": 12, "hot": 12, "encod": [12, 114, 126, 132], "60": [12, 58, 71, 109, 130], "recurs": 12, "6": [12, 24, 28, 29, 30, 31, 35, 44, 46, 47, 48, 49, 50, 51, 52, 53, 54, 58, 61, 63, 65, 79, 80, 81, 84, 85, 92, 94, 95, 98, 99, 100, 101, 102, 103, 105, 106, 107, 108, 112, 114, 122, 130, 141], "float64": 12, "notimplementederror": 12, "int32": 12, "15": [12, 24, 47, 50, 51, 52, 53, 54, 58, 77, 90, 98, 99, 101, 102, 105, 108, 109, 113, 136], "datapoint": 12, "k": [12, 14, 90, 107, 136], "m": [12, 24, 43, 92, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 116, 132, 136], "would": [12, 17, 19, 20, 98, 99, 100, 101, 102, 107, 108, 115, 124, 128, 130, 132, 134, 136], "copi": [13, 15, 132], "item": [13, 14, 109, 136, 139], "77395606": 13, "43887845": 13, "85859793": 13, "697368": 13, "09417735": 13, "97562236": 13, "stopiter": 13, "fn": 13, "multi_binari": 13, "built": [13, 23, 109, 119, 130], "multi_discret": 13, "ctx": 13, "mp": 13, "multiprocess": [13, 15], "opt": 13, "hostedtoolcach": 13, "9": [13, 15, 24, 28, 31, 36, 45, 50, 51, 52, 53, 54, 58, 61, 71, 80, 85, 92, 96, 98, 99, 100, 101, 102, 103, 105, 106, 108, 111, 136, 139], "16": [13, 24, 33, 36, 39, 45, 50, 51, 52, 53, 54, 58, 96, 98, 99, 101, 102, 105, 108, 113, 130, 139, 141], "x64": 13, "lib": [13, 112], "python3": 13, "eventu": 13, "shared_memori": [13, 15], "customspaceerror": 13, "read": [13, 23, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 89, 90, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 112, 113, 114, 129, 130], "forward": [13, 35, 57, 88, 98, 99, 100, 101, 102, 107, 108, 118, 122, 123, 136, 141], "side": [13, 19, 26, 39, 54, 56, 90], "write": [13, 15, 130, 132], "num_env": [13, 15, 136], "plai": [14, 21, 34, 47, 60, 79, 84, 89, 109, 122, 124, 130, 132, 139], "transpos": [14, 132], "zoom": 14, "callback": [14, 123], "keys_to_act": [14, 124, 136], "w": [14, 98, 101, 102, 136], "7": [14, 24, 28, 30, 31, 35, 44, 46, 47, 48, 49, 50, 51, 52, 53, 54, 58, 61, 63, 65, 80, 81, 84, 85, 98, 99, 100, 101, 102, 103, 105, 106, 107, 108, 122, 136], "dw": 14, "verifi": 14, "level": [14, 16, 21, 24, 31, 48, 70, 78, 109], "unplay": 14, "wish": [14, 19, 23, 122], "real": [14, 56, 99], "playplot": 14, "150": 14, "def": [14, 132, 134, 136, 139, 141], "obs_t": 14, "obs_tp1": 14, "plotter": 14, "amount": [14, 44, 46, 47, 49, 55, 74, 88, 93, 103, 104, 141], "receiv": [14, 15, 21, 34, 37, 41, 44, 45, 51, 57, 60, 89, 90, 95, 108, 114, 124, 133, 136, 139, 141], "map": [14, 19, 21, 42, 113, 114, 130, 132, 139, 141], "unicod": 14, "suppos": 14, "trigger": [14, 114], "key_to_act": 14, "ord": [14, 132], "unknown": [14, 109], "horizon_timestep": 14, "plot_nam": 14, "live": [14, 27, 30, 33, 34, 36, 39, 44, 45, 48, 55, 59, 60, 66, 72, 77, 139], "compute_metr": 14, "obs_tp": 14, "cumulative_reward": 14, "linalg": [14, 132], "norm": [14, 105, 106, 132], "along": [14, 16, 21, 22, 58, 59, 61, 72, 89, 93, 94, 95, 99, 103, 104, 107, 112, 124, 130], "conjunct": 14, "evolv": 14, "200": [14, 49, 72, 90, 92, 93, 94, 96, 113, 114], "magnitud": [14, 90, 95, 103, 104, 141], "your_env": 14, "len": [14, 134, 136, 139], "horizon": [14, 74, 100, 108, 133], "titl": [14, 94, 95, 139, 141], "matplotlib": [14, 136, 139, 141], "playablegam": 14, "process_ev": 14, "event": [14, 121, 132], "particular": [14, 16, 19, 21, 22, 90, 130, 133], "exit": [14, 15], "save_video": [14, 127], "episode_index": 14, "step_starting_index": 14, "extract": 14, "compos": 14, "isn": 14, "imagesequenceclip": 14, "durat": [14, 98, 100, 101, 102, 103, 104, 105, 106, 108, 117, 141], "step_index": 14, "199": 14, "episode_id": 14, "27": [14, 92, 98, 101, 102], "729": 14, "2000": [14, 88, 114], "3000": 14, "schedul": [14, 113], "step_api_compat": [14, 22], "step_return": 14, "output_truncation_bool": [14, 18], "is_vector_env": 14, "doc": [14, 18, 90, 118, 130, 134], "interfac": [14, 115], "conflict": [14, 109], "desir": [14, 107, 108, 114, 136], "vec_env": 14, "convert_to_terminated_truncated_step_api": [14, 22], "irrespect": 14, "convert_to_done_step_api": 14, "omit": [14, 97, 98, 99, 100, 101, 102, 107, 108], "env_check": [14, 122], "check_env": [14, 130], "skip_render_check": 14, "invas": [14, 78], "org": [14, 24, 130, 136, 139, 141], "content": 14, "environment_cr": [14, 132], "ignor": [14, 24, 111, 122, 124, 139], "ci": [14, 116, 117, 118, 121, 129, 130], "linear": [15, 90, 92, 103, 104, 107, 136, 141], "speed": [15, 35, 88, 89, 130, 136], "wait": [15, 48, 50, 74, 127, 133], "overwritten": [15, 16, 124, 129, 130], "asyncvectorenv": [15, 130, 136], "syncvectorenv": 15, "single_observation_spac": [15, 136], "single_action_spac": [15, 136], "v25": [15, 23], "vectorlistinfo": [15, 16, 18, 122], "share": [15, 141], "other": [15, 17, 18, 19, 22, 30, 39, 42, 50, 56, 90, 96, 97, 99, 103, 105, 106, 108, 113, 114, 117, 118, 127, 130, 132, 134, 136, 139, 141], "word": [15, 105, 141], "01522993": 15, "04562247": 15, "04799704": 15, "03392126": 15, "03774345": 15, "02418869": 15, "00942293": 15, "0469184": 15, "18847767": 15, "26141977": 15, "01431748": 15, "24002443": 15, "04731862": 15, "3110827": 15, "03822722": 15, "1710671": 15, "00848456": 15, "2487226": 15, "releas": [15, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 92, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 112, 113, 114, 132], "resourc": [15, 132, 139], "viewer": [15, 130], "close_extra": 15, "synchron": 15, "asynchron": 15, "garbag": 15, "registri": [15, 21, 122, 130], "env_fn": 15, "context": [15, 141], "daemon": 15, "worker": [15, 68], "pipe": [15, 118], "commun": [15, 23, 124, 127], "81": [15, 96, 130], "62": 15, "14995256": 15, "9886932": 15, "12224312": 15, "5760367": 15, "8174238": 15, "91244936": 15, "back": [15, 16, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 52, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 98, 99], "effici": [15, 19, 94, 95, 103, 130, 136], "subprocess": 15, "flag": [15, 94, 109], "quit": [15, 132], "head": [15, 99], "spawn": [15, 106, 136], "children": 15, "overrid": [15, 134], "inner": 15, "logic": [15, 89, 118, 132], "degre": [15, 101, 102, 103, 134, 136], "chanc": 15, "shoot": [15, 31, 40, 42, 47, 48, 55, 56, 65, 68, 72, 77, 78, 86], "yourself": [15, 48, 68, 89, 132, 139], "foot": [15, 99, 100, 108], "thu": [15, 24, 50, 51, 52, 53, 54, 105, 106, 109, 136], "_worker": 15, "_worker_shared_memori": 15, "runtimeerror": 15, "serial": [15, 136], "without": [16, 21, 23, 46, 101, 111, 113, 119, 125, 129, 130, 132, 139], "alter": [16, 21, 24, 132], "lot": [16, 21, 134, 139, 141], "boilerpl": [16, 21, 132, 134], "modular": [16, 21, 109, 132, 134], "chain": [16, 21, 92, 107], "base_env": [16, 21], "underneath": [16, 21, 93], "anoth": [16, 39, 101, 102, 104, 105, 106, 108, 114, 129, 133, 139, 141], "hopperenv": 16, "layer": [16, 21, 141], "bare": 16, "hopper_v4": 16, "0x7fbb5efd0490": 16, "thing": [16, 24, 119, 127, 134], "Such": [16, 134], "actionwrapp": [16, 17], "observationwrapp": [16, 19, 132], "rewardwrapp": [16, 20], "behavior": [16, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 96, 98, 99, 100, 101, 102, 107, 108, 109, 117, 119, 132, 134], "forget": [16, 132], "wrapperobstyp": [16, 19], "commonli": [16, 21, 127], "found": [16, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 97, 109, 122, 139, 141], "descript": [16, 130, 132], "misc": 16, "tp": 16, "21": [16, 22, 98, 101, 102, 105, 111, 119, 130, 136, 139], "request": [16, 111], "anobserv": 16, "save": [16, 18, 23, 118, 134], "axbxc": [16, 19], "append": [16, 19, 136, 139, 141], "th": 16, "overwrit": [17, 19, 20], "domain": [17, 89, 92, 94, 95, 114, 134, 135, 137], "among": [17, 19, 91, 97], "new_ob": 18, "final_reward": 18, "final_termin": 18, "final_trunc": 18, "final_don": 18, "prior": 18, "alongsid": 18, "re": [18, 56, 71, 74, 118, 122, 130, 132, 141], "old_env": 18, "legacyenv": 18, "retun": 18, "modern": [18, 109], "convers": [18, 22, 109], "cartpoleenv": 18, "place": [18, 28, 93, 94, 95, 132, 136], "\u01f9one": 18, "outermost": 18, "reflect": [19, 93, 124], "f": [19, 20, 136, 139, 141], "ideal": 19, "subclass": 19, "accordingli": [19, 74, 132], "incorrectli": [19, 133], "randn": [19, 119, 127], "20380084": 19, "03390356": 19, "13373359": 19, "24382612": 19, "lz4_compress": 19, "lazyfram": 19, "lz4": 19, "compress": 19, "singleton": 19, "axbx1": 19, "axb": 19, "render_kwarg": 19, "pixel_kei": 19, "odict_kei": 19, "400": [19, 114], "600": [19, 136], "assertionerror": 19, "typeerror": 19, "unexpect": [19, 117], "64": [19, 24, 130], "invari": 20, "incorrect": [20, 114, 124, 125, 133], "mountain": [21, 91, 125], "car": [21, 33, 49, 87, 91, 109, 122, 124, 125], "four": [21, 33, 44, 89, 90, 98, 100, 108, 114, 139], "introduc": [21, 22, 23, 98, 101, 102, 123, 124], "core": [21, 124, 127, 130], "markov": [21, 133], "decis": [21, 23, 109, 127, 133], "theori": [21, 96, 103, 124, 136], "perfect": 21, "reconstruct": 21, "compon": [21, 132], "veri": [21, 90, 105, 116, 127, 128, 129, 130, 132, 136], "easi": [21, 60, 110, 127], "classic": [21, 23, 90, 92, 93, 94, 95, 96, 100, 104, 107, 108, 117, 122, 124, 130, 133], "loop": [21, 23, 109, 136, 139], "pictur": 21, "simplifi": [21, 96, 122, 126, 130], "someth": [21, 127], "spaceship": [21, 31, 45, 76], "land": [21, 38, 72, 90], "safe": [21, 68, 90], "document": [21, 24, 25, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 91, 98, 101, 102, 103, 110, 116, 118, 119, 130, 132, 136, 139], "imagin": [21, 109, 134], "robot": [21, 23, 36, 86, 88, 94, 95, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 119, 133], "destroi": [21, 27, 29, 31, 32, 33, 34, 35, 36, 39, 40, 41, 42, 45, 46, 54, 60, 71, 72, 73, 76, 77, 78, 80, 90], "enemi": [21, 28, 29, 32, 34, 35, 36, 42, 45, 46, 48, 61, 70, 71, 73, 74, 76, 77, 78, 80, 86], "exchang": 21, "crash": [21, 90], "succeed": 21, "similarli": [21, 90, 130], "restart": 21, "train": [21, 23, 118, 122, 130, 135], "major": [21, 124, 130], "our": [21, 130, 132, 136, 139], "simpl": [21, 88, 110, 115, 133, 141], "coupl": [21, 136], "nich": 21, "li": [21, 109], "lie": 21, "manual": [21, 23, 24, 50, 51, 52, 53, 54, 136], "aspect": [21, 127, 133], "box2d": [21, 88, 89, 90, 119, 122, 126], "bipedal_walk": [21, 88], "0x7f87d70712d0": 21, "regist": [22, 24, 127], "sole": [22, 127], "special": [22, 27, 57, 141], "gymv26environ": 22, "relev": [22, 118, 132], "pong": [22, 24, 39, 43], "v5": [22, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86], "introduct": [22, 92, 111, 112], "signatur": 22, "previous": [22, 24, 33, 127, 128], "backward": [22, 99, 119, 121, 124, 125, 128, 136, 141], "compliant": [22, 23, 116, 122], "oldv21env": 22, "break": [23, 31, 39, 89, 116, 118, 121, 130], "briefli": 23, "outlin": [23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 111, 119, 139], "still": [23, 24, 122, 127, 130, 134, 136, 139], "stuck": [23, 27, 36, 55], "123": [23, 130], "becaus": [23, 132, 134, 136, 139], "emul": [23, 24, 118], "randint": [23, 119, 127], "utilis": [23, 127], "contrast": 23, "older": [23, 97], "definit": [23, 98, 100, 101, 125, 133], "expand": [23, 24, 50, 51, 52, 53, 54], "blog": [23, 124, 127], "post": [23, 32, 124, 127], "soon": [23, 124, 127, 132], "extra": [23, 28, 33, 34, 36, 40, 42, 55, 74, 109, 116, 130, 132, 139], "address": 23, "associ": [23, 120], "librari": [23, 115, 130, 132], "primari": 23, "shouldn": [23, 132], "happen": [23, 73, 94, 95, 98, 100, 101, 102, 103, 104, 105, 106, 108, 111, 113, 114, 124, 133], "fly": [23, 26, 31, 55, 71, 90], "shown": [23, 59, 89, 92, 133], "explan": [23, 139, 141], "summari": 23, "goalenv": 23, "reimplement": 23, "classic_control": [23, 119, 122], "system": [23, 54, 92, 96, 103, 104, 109, 118], "monitor": [23, 117, 120], "stella": 24, "adventur": [24, 43], "air": [24, 43], "raid": [24, 43], "alien": [24, 43, 45, 65, 78], "amidar": [24, 32, 43], "assault": [24, 43], "asterix": [24, 43], "asteroid": [24, 43], "atlanti": [24, 43], "licens": [24, 109, 118, 136, 139, 141], "download": [24, 132, 133, 134, 136, 137, 139, 141], "locat": [24, 60, 109, 112, 113, 114, 132], "agre": 24, "todo": [24, 114], "legal": [24, 50, 51, 52, 53, 54], "fire": [24, 26, 28, 29, 31, 32, 35, 37, 39, 40, 50, 51, 52, 53, 54, 57, 64, 65, 67, 68, 70, 71, 73, 74, 77, 78, 80, 82, 84, 85, 90], "upright": [24, 30, 31, 35, 44, 46, 47, 48, 49, 50, 51, 52, 53, 54, 58, 63, 93, 96, 103, 104], "upleft": [24, 30, 31, 35, 44, 46, 47, 48, 49, 50, 51, 52, 53, 54, 58, 63], "downright": [24, 30, 44, 46, 47, 48, 49, 50, 51, 52, 53, 54, 58, 61, 63], "downleft": [24, 30, 44, 46, 47, 48, 49, 50, 51, 52, 53, 54, 58, 61, 63], "upfir": [24, 28, 31, 37, 50, 51, 52, 53, 54, 68, 80, 81, 82, 84, 85], "11": [24, 31, 50, 51, 52, 53, 54, 58, 61, 98, 99, 100, 101, 102, 103, 105, 106, 108, 111, 112, 136, 139], "rightfir": [24, 26, 28, 29, 31, 32, 35, 40, 50, 51, 52, 53, 54, 58, 61, 64, 65, 67, 77, 80, 81, 84, 85], "leftfir": [24, 26, 28, 29, 31, 32, 40, 50, 51, 52, 53, 54, 58, 61, 64, 65, 67, 77, 80, 81, 84, 85], "13": [24, 31, 50, 51, 52, 53, 54, 58, 61, 98, 99, 101, 102, 105, 108, 114, 130], "downfir": [24, 28, 31, 37, 50, 51, 52, 53, 54, 58, 61, 65, 68, 80, 82, 85], "14": [24, 50, 51, 52, 53, 54, 58, 88, 90, 98, 99, 101, 102, 105, 108, 139], "uprightfir": [24, 31, 50, 51, 52, 53, 54, 58, 61], "upleftfir": [24, 31, 50, 51, 52, 53, 54, 58, 61], "downrightfir": [24, 50, 51, 52, 53, 54, 58, 61], "17": [24, 36, 50, 51, 52, 53, 54, 58, 98, 99, 101, 102, 105, 108, 111], "downleftfir": [24, 50, 51, 52, 53, 54, 58, 61], "smaller": [24, 29, 31, 50, 51, 52, 53, 54], "enumer": [24, 50, 51, 52, 53, 54], "full_action_spac": [24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86], "reduc": [24, 26, 28, 29, 30, 31, 32, 35, 37, 39, 40, 44, 46, 47, 48, 49, 50, 51, 52, 53, 54, 58, 61, 63, 64, 65, 67, 68, 70, 75, 77, 78, 80, 81, 82, 84, 85, 93, 136, 139], "difficulti": [24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 109, 125], "choic": [24, 136, 141], "player": [24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 109, 111, 112, 113, 114, 139], "128": [24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 136], "byte": [24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86], "ram": [24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86], "exact": [24, 37, 50, 51, 52, 53, 54, 111, 139], "atariag": [24, 25, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 79, 81, 82, 83, 84, 85, 86], "determinist": [24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 92, 94, 95, 132, 136], "art": 24, "memor": 24, "sticki": [24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86], "small": [24, 54, 73, 88, 109, 110, 116, 119, 120, 121, 130, 141], "On": [24, 65, 92, 93, 94, 95, 96, 122], "top": [24, 39, 44, 51, 57, 59, 73, 89, 90, 91, 94, 95, 100, 103, 104, 108, 119, 124, 125, 132, 141], "frameskip": [24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86], "exclus": 24, "tabl": [24, 27, 28, 30, 44, 46, 101, 102, 105, 123], "obs_typ": 24, "Its": 24, "stick": [24, 33, 55, 111, 139], "ll": [24, 57, 74, 127, 136, 139], "sound": 24, "lock": 24, "proper": [24, 118, 127], "audio": 24, "framer": [24, 102, 105, 106, 132], "best": [24, 50, 51, 52, 53, 54, 136, 139], "practic": [24, 50, 51, 52, 53, 54, 109, 124, 133, 139], "configur": [24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 91, 97, 110, 132, 136, 139], "let": [24, 39, 109, 132, 134, 139, 141], "variat": 24, "amidardeterminist": 24, "amidarnoframeskip": 24, "ramdeterminist": 24, "ramnoframeskip": 24, "suffix": [24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86], "noframeskip": [24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86], "airraid": [24, 26], "31": [24, 31, 101, 102, 130], "bankheist": [24, 33], "20": [24, 33, 39, 66, 74, 90, 98, 101, 102, 105, 114, 118, 130, 136, 139], "battlezon": [24, 34], "beamrid": [24, 35], "berzerk": [24, 43], "18": [24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 98, 99, 101, 102, 105, 108, 116], "bowl": [24, 43], "breakout": [24, 43], "36": [24, 39, 101, 102, 112], "40": [24, 39, 64, 101, 102], "44": [24, 39, 101, 102], "carniv": [24, 43], "centiped": [24, 43], "22": [24, 41, 98, 101, 102, 105, 120, 122, 127, 130, 139], "86": [24, 41], "choppercommand": [24, 42], "crazyclimb": [24, 44], "defend": [24, 32, 43, 48, 64, 76], "demonattack": [24, 46], "doubledunk": [24, 47], "elevatoract": [24, 48], "enduro": [24, 43], "fishingderbi": 24, "freewai": [24, 43], "frostbit": [24, 43], "gopher": [24, 43], "gravitar": [24, 43], "hero": [24, 43], "icehockei": 24, "jamesbond": [24, 43], "journeyescap": 24, "kangaroo": [24, 43], "krull": [24, 43], "kungfumast": [24, 61], "montezumareveng": [24, 62], "mspacman": [24, 63], "namethisgam": [24, 64], "phoenix": [24, 43], "pitfal": [24, 43, 88], "pooyan": [24, 43], "50": [24, 58, 68, 74, 90, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 141], "70": [24, 68, 130], "privateey": 24, "qbert": [24, 43], "riverraid": [24, 43], "roadrunn": [24, 72], "robotank": [24, 43, 73], "seaquest": [24, 43], "ski": [24, 43], "solari": [24, 43], "spaceinvad": 24, "stargunn": 24, "tenni": [24, 43], "timepilot": 24, "tutankham": [24, 43], "upndown": [24, 82], "ventur": [24, 43], "videopinbal": [24, 84, 85], "wizardofwor": [24, 85], "yarsreveng": 24, "zaxxon": [24, 43], "oppos": 24, "ai": [24, 109], "mg": 24, "bellemar": 24, "naddaf": 24, "j": [24, 136, 141], "veness": 24, "platform": 24, "journal": [24, 114], "artifici": [24, 114], "intellig": [24, 114, 119], "research": [24, 97, 103, 114], "2012": 24, "url": [24, 127, 136], "jair": [24, 114], "php": 24, "articl": [24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86], "view": [24, 54], "11182": 24, "250": [25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 130], "160": [25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 130], "enchant": [25, 41], "chalic": 25, "golden": 25, "castl": 25, "pick": [25, 48, 59, 72, 114, 136, 139], "sword": 25, "bridg": [25, 71, 109], "magnet": 25, "fight": [25, 38, 61, 64, 109], "outmanoeuvr": 25, "dragon": 25, "flavor": [25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86], "switch": [25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 109, 116, 130], "thorough": [25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86], "discuss": [25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 119, 130], "intric": [25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86], "stochast": [25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 91, 92, 94, 95, 97, 98, 99, 100, 101, 102, 103, 104, 106, 107, 108, 112, 114, 117], "ship": [26, 27, 29, 35, 45, 54, 76], "sidewai": [26, 29, 35, 71, 75], "protect": [26, 32, 41, 42, 53, 58, 68], "saucer": [26, 31, 78], "try": [26, 27, 28, 37, 39, 44, 67, 68, 122, 129, 130, 139], "drop": [26, 33, 114, 130], "bomb": [26, 45, 57, 65, 78], "those": [26, 28, 29, 30, 31, 32, 35, 37, 39, 40, 44, 46, 47, 48, 49, 58, 61, 63, 64, 65, 67, 68, 70, 75, 77, 78, 80, 81, 82, 84, 85, 92, 97, 98, 99, 100, 101, 102, 103, 104, 108, 124, 127, 134, 136], "meaning": [26, 28, 29, 30, 31, 32, 35, 37, 39, 40, 44, 46, 47, 48, 49, 58, 61, 63, 64, 65, 67, 68, 70, 75, 77, 78, 80, 81, 82, 84, 85], "210": [27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 45, 46, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86], "maze": [27, 28, 33, 36, 62, 81], "egg": 27, "scatter": [27, 69], "simultan": [27, 28], "kill": [27, 36, 55, 60], "flamethrow": 27, "awai": [27, 67, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 134], "tricki": 27, "situat": [27, 114], "occasion": [27, 31], "pulsar": 27, "temporari": 27, "abil": [27, 130], "score": [27, 28, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 55, 56, 57, 58, 59, 60, 66, 67, 68, 69, 70, 71, 72, 74, 78, 79, 80, 84, 88, 90], "prize": [27, 82], "caught": [27, 33, 125], "lose": [27, 30, 32, 41, 44, 45, 48, 55, 57, 66, 67, 69, 71, 72, 74, 75, 76, 90, 111, 139], "consult": [27, 56, 57, 58, 59, 60], "pac": 28, "man": 28, "visit": [28, 48, 89], "grid": [28, 112, 113, 114, 132, 139], "chicken": [28, 40, 51], "catch": [28, 44, 50, 72], "travers": 28, "vehicl": [29, 34, 49, 58], "big": [29, 50, 132], "mother": [29, 59, 68], "circl": [29, 132], "overhead": [29, 90], "deploi": 29, "drone": 29, "dodg": [29, 35, 74], "attack": [29, 31, 32, 35, 43, 45, 68], "horizont": [30, 40, 88, 90, 92, 132], "vertic": [30, 88, 103, 104, 132], "lyre": 30, "guid": [30, 51, 109, 130], "suffici": [30, 32, 34, 36, 41, 139], "award": [30, 36, 41, 44, 48, 74, 103, 104], "field": 31, "appear": [31, 33, 36, 73, 94, 95], "satellit": 31, "ufo": 31, "job": [32, 132], "submerg": 32, "citi": [32, 33, 69], "slowli": 32, "descend": 32, "toward": [32, 56, 107, 119], "strike": [32, 37], "distanc": [32, 49, 99, 132], "defens": [32, 47], "manag": [32, 37], "seven": 32, "fought": 32, "wave": [32, 42, 46, 58, 65, 78], "outer": [32, 92], "robber": 33, "natur": [33, 111, 113, 139], "rob": 33, "getawai": 33, "navig": [33, 69, 114, 132, 134], "polic": 33, "chase": [33, 36], "dynamit": [33, 55], "ga": [33, 89], "tank": [33, 34, 74], "nine": [33, 98], "leav": [33, 93, 97, 103, 132], "person": [34, 92, 109], "perspect": [34, 109], "3d": [34, 98, 101, 102, 109, 139], "illus": 34, "radar": [34, 85], "gain": [34, 70, 76, 77, 80, 134], "travel": 35, "steer": [35, 82, 89], "debri": 35, "leftifir": 35, "evil": [36, 61, 86], "touch": [36, 69, 132], "wall": [36, 39, 55, 94, 95, 114], "undefeat": 36, "otto": 36, "tri": 37, "knock": [37, 38], "pin": 37, "spar": 37, "spare": 37, "300": [37, 49, 88, 132], "oppon": [38, 50, 56, 67, 82], "ring": 38, "hit": [38, 39, 40, 41, 46, 68, 69, 72, 73, 75, 111, 139], "punch": [38, 59], "famou": 39, "paddl": [39, 67], "ball": [39, 56, 67, 84], "brick": 39, "wreak": 39, "havoc": 39, "five": [39, 69, 75, 91, 124, 141], "214": 40, "em": 40, "target": [40, 92, 105, 106, 132, 133, 134, 136], "gun": [40, 48], "suppli": [40, 64, 133], "ammunit": 40, "steal": [40, 50], "bullet": [40, 109], "subtract": [40, 136], "minu": 40, "sign": [40, 103, 104, 141], "elf": [41, 113], "magic": 41, "wand": 41, "fend": 41, "spider": 41, "flea": 41, "mushroom": 41, "forest": 41, "bitten": 41, "tempor": 41, "paralyz": 41, "scorpion": 41, "round": 41, "helicopt": [42, 44, 71], "truck": [42, 72], "convoi": 42, "aircraft": [42, 80], "mini": 42, "bottom": [42, 57, 89, 94, 95, 100, 108, 112], "plane": 42, "surviv": [42, 46], "bank": [43, 71], "heist": 43, "battl": 43, "zone": 43, "beam": [43, 55], "rider": 43, "chopper": 43, "command": [43, 97], "crazi": 43, "climber": 43, "demon": 43, "doubl": [43, 97], "dunk": 43, "elev": 43, "fish": 43, "derbi": 43, "ic": [43, 46, 52, 56, 113], "hockei": [43, 56], "journei": [43, 58, 127, 139], "kung": 43, "fu": 43, "master": [43, 112, 118, 141], "montezuma": 43, "reveng": 43, "pacman": 43, "privat": [43, 69, 132], "ey": [43, 64, 69], "road": [43, 89], "runner": 43, "invad": [43, 77], "star": 43, "gunner": 43, "pilot": [43, 65, 86], "pinbal": 43, "wizard": [43, 61], "Of": 43, "wor": 43, "yar": 43, "builid": 44, "obstacl": [44, 58, 59], "fall": [44, 46, 66, 72, 88, 101, 112, 113, 133], "damag": [44, 73], "climb": [44, 59, 91], "fast": [44, 89, 97, 99, 101, 103, 107, 109], "least": [44, 79, 90], "row": [44, 77, 112, 113], "earth": [45, 77], "rescu": [45, 55, 59, 60, 61, 74, 76], "smart": 45, "shot": [45, 47, 48, 56, 57, 72, 109], "abduct": 45, "unlimit": 45, "laser": [45, 55, 77, 85], "missil": [45, 71], "aliv": [45, 101, 108], "face": [46, 98, 101, 102, 111, 139], "planet": [46, 54, 76], "krybor": 46, "accumul": 46, "reserv": [46, 71, 73, 74], "bunker": [46, 54], "increas": [46, 74, 90, 92, 93, 100, 107, 108, 136, 139], "grant": [46, 90], "slai": 46, "2v2": 47, "basketbal": 47, "possess": 47, "rival": 47, "team": [47, 117], "rule": [47, 79, 109, 111, 139], "foul": 47, "success": [47, 92, 114, 130, 133], "secret": [48, 69], "ground": [48, 68, 88, 90, 98, 102, 109], "stair": 48, "equip": 48, "against": [48, 67, 79, 109, 123], "floor": 48, "gather": [48, 69, 132], "apart": [48, 132], "mark": 48, "red": [48, 54, 114, 122, 132], "door": 48, "unreleas": 48, "prototyp": 48, "500": [48, 71, 92, 93, 114, 127, 136, 139], "racer": 49, "nation": 49, "long": [49, 84, 93, 103, 104, 117, 130], "endur": 49, "race": [49, 72, 75, 87, 122, 124], "overtak": 49, "dai": [49, 87], "stai": [49, 136], "meet": 49, "quota": 49, "sunfish": 50, "But": [50, 75, 98], "fisherman": 50, "black": [50, 60, 92, 116, 122, 139], "shark": [50, 64, 74], "lurk": [50, 70], "surfac": [50, 74, 103, 104, 132], "lane": [51, 109], "busi": 51, "rush": 51, "hour": 51, "traffic": [51, 109], "cross": [51, 112, 113], "bailei": 52, "who": [52, 53, 58, 59, 75, 130], "hop": [52, 70, 100, 108], "forth": 52, "arctic": 52, "river": [52, 71], "block": 52, "white": [52, 122], "blue": [52, 54, 79, 92, 114, 132], "he": [52, 54], "hi": [52, 54, 69], "igloo": 52, "shovel": 53, "wield": 53, "farmer": 53, "crop": 53, "carrot": 53, "spacecraft": 54, "fiction": 54, "solar": 54, "landscap": 54, "miner": 55, "mine": [55, 72], "shaft": 55, "tool": [55, 62], "propel": 55, "backpack": 55, "wherev": 55, "blast": [55, 74, 76], "vermin": 55, "raft": 55, "stretch": 55, "critter": 55, "standard": [56, 98, 99, 103, 109, 117, 118, 119, 120, 136, 141], "minut": [56, 66], "period": [56, 100, 108], "puck": 56, "angl": [56, 57, 88, 90, 92, 93, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 128], "extrem": [56, 109, 110], "rink": 56, "realli": [56, 139], "mr": 57, "bond": 57, "design": [57, 92, 98, 101, 102, 109, 110, 114, 132], "multipurpos": 57, "craft": [57, 90], "varieti": [57, 109], "motion": [57, 109], "slightli": [57, 88, 98], "jump": [57, 72, 75], "dive": 57, "lob": 57, "rate": [57, 74, 136, 139, 141], "highest": 57, "novic": 57, "006": 57, "007": 57, "lead": [58, 136], "peski": 58, "backstag": 58, "scarab": 58, "000": [58, 71, 74], "concert": 58, "cash": 58, "grasp": 58, "groupi": 58, "photograph": 58, "promot": 58, "encount": [58, 59, 80], "her": [59, 68], "preciou": 59, "babi": 59, "ladder": [59, 88], "bonu": [59, 73, 74, 78, 108, 136], "fruit": 59, "throw": [59, 134], "monkei": 59, "corner": 59, "beast": 60, "fortress": [60, 62], "princess": [60, 61], "lyssa": 60, "sunris": 60, "monster": [60, 83], "templ": 61, "victoria": 61, "defeat": [61, 70], "acquir": [62, 97], "treasur": [62, 64, 66, 81, 83], "chamber": [62, 83], "emperor": 62, "deadli": 62, "creatur": [62, 70, 78, 109], "valuabl": 62, "pellet": 63, "ghost": 63, "discov": 64, "octopu": 64, "oxygen": [64, 74], "elimin": [65, 81, 82, 83], "war": 65, "bird": 65, "harri": 66, "jungl": 66, "die": [66, 68, 89], "misfortun": 66, "hole": [66, 113], "compet": 67, "deflect": 67, "pig": 68, "piglet": 68, "wolv": 68, "rope": 68, "balloon": 68, "guard": 68, "eat": [68, 72], "bait": 68, "wolf": 68, "stone": 68, "rock": [68, 72], "french": 69, "pierr": 69, "street": 69, "park": 69, "passag": 69, "dead": [69, 116, 120, 130], "search": 69, "ringlead": 69, "henri": 69, "le": 69, "fiend": 69, "gang": 69, "evid": 69, "stolen": 69, "good": [69, 136, 139], "statut": 69, "expir": 69, "nab": 69, "question": [69, 109], "auto": [69, 130], "pothol": 69, "q": [70, 114, 133, 136, 137, 140], "bert": 70, "pyramid": 70, "destin": [70, 114], "nasti": 70, "jet": 71, "fli": 71, "fuel": [71, 76, 90], "depot": 71, "collid": [71, 74, 90], "squadron": [71, 73], "tanker": 71, "80": [71, 113], "tm": 72, "direct": [72, 74, 92, 93, 94, 95, 98, 100, 101, 103, 104, 108, 112, 113, 114, 132, 141], "outrun": 72, "wile": 72, "coyot": 72, "hazard": 72, "desert": 72, "rocket": [72, 73, 90], "cannon": [72, 77], "cliff": [72, 110], "steel": 72, "pile": 72, "birdse": 72, "cannonbal": 72, "activ": [73, 132], "scrambl": 73, "static": 73, "interfer": 73, "sensor": [73, 89], "report": [73, 88, 98, 101, 102, 124, 130], "flash": 73, "panel": 73, "c": [73, 90, 92, 130, 141], "earn": 73, "twelv": 73, "abl": [74, 130, 133], "torpedo": 74, "diver": 74, "killer": 74, "deliv": [74, 114], "six": [74, 108], "explod": 74, "anyth": 74, "decreas": [74, 90], "almost": [74, 127], "yoursub": 74, "blow": 74, "forc": [74, 76, 90, 93, 94, 95, 98, 101, 102, 103, 104, 117, 141], "less": [74, 88, 90, 103, 107], "worth": [74, 77], "90": [74, 139], "skier": 75, "gate": 75, "fastest": 75, "penal": [75, 134], "tree": 75, "slalom": 75, "penalti": [75, 114], "warp": 76, "sector": 76, "feder": 76, "zylon": 76, "refuel": 76, "cadet": 76, "corridor": 76, "mania": [78, 80], "orang": 79, "win": [79, 111, 139], "margin": 79, "ti": 79, "sport": 79, "till": [79, 136, 139], "technologi": 80, "increasingli": 80, "difficult": [80, 93, 97, 103, 104], "rack": 81, "tomb": 81, "guardian": 81, "baja": 82, "bugger": 82, "dungeon": 83, "beat": [85, 111], "scanner": 85, "armi": 86, "enslav": 86, "galaxi": 86, "fighter": 86, "biped": [87, 101, 102, 117, 119, 122], "walker": [87, 97, 106, 108, 117, 119, 122], "lunar": [87, 119, 122, 125], "lander": [87, 119, 122, 125], "toi": [87, 111, 112, 113, 114, 117], "contribut": [87, 130], "earli": [87, 139, 141], "oleg": [87, 88, 89, 90], "klimov": [87, 88, 89, 90], "popular": [87, 109, 139], "benchmark": 87, "ever": [87, 119], "joint": [88, 90, 92, 93, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108], "uneven": 88, "terrain": [88, 109], "hardcor": 88, "stump": 88, "1600": 88, "heurist": [88, 90], "demonstr": [88, 109], "motor": [88, 107, 127], "hip": [88, 98, 101, 102], "knee": [88, 101, 102], "hull": 88, "angular": [88, 90, 92, 93, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108], "leg": [88, 90, 98, 100, 101, 102, 108], "contact": [88, 90, 97, 98, 101, 102, 103, 122], "lidar": 88, "rangefind": 88, "measur": [88, 96, 98, 99, 100, 101, 102, 103, 105, 106, 107, 108, 117], "far": [88, 89, 103, 105, 106, 113], "torqu": [88, 92, 96, 98, 99, 100, 101, 102, 105, 106, 107, 108], "cost": [88, 99, 100, 107, 108, 109], "better": [88, 117, 130, 136], "stand": [88, 97, 98, 101, 102, 103, 104, 130, 139], "slight": 88, "exce": [88, 111], "closest": 88, "trace": 88, "furthest": 88, "faster": [88, 90, 102, 136], "energi": [88, 90, 93, 109, 134], "spent": [88, 90], "friction": [88, 107, 109], "nervous": 88, "easiest": [89, 118], "ab": [89, 136], "wheel": [89, 128], "gyroscop": 89, "car_rac": [89, 119], "rear": 89, "drive": 89, "brake": 89, "96x96": 89, "tile": 89, "732": 89, "926": 89, "rest": [89, 90, 100, 108, 136], "playfield": 89, "lap_complete_perc": 89, "dictat": [89, 90], "percentag": [89, 139], "lap": [89, 124], "domain_random": 89, "variant": [89, 132], "scenario": [89, 109], "background": 89, "demand": 89, "correspondingli": 89, "init": [89, 132, 136], "scheme": [89, 109], "chri": 89, "campbel": 89, "2014": 89, "www": [89, 111, 112, 113, 119, 127], "iforce2d": 89, "net": [89, 111, 112, 136, 141], "b2dtut": 89, "pontryagin": 90, "principl": 90, "engin": [90, 97, 130], "throttl": 90, "why": 90, "pad": 90, "infinit": [90, 100, 108, 111, 122, 133, 139], "lunar_land": 90, "orient": [90, 98, 101, 102], "sum": [90, 98, 99, 100, 101, 102, 105, 106, 107, 108, 111, 139], "closer": [90, 111], "slower": [90, 136], "tilt": 90, "03": 90, "solut": [90, 139], "viewport": 90, "mass": [90, 98, 99, 101, 102, 107], "bodi": [90, 97, 98, 99, 100, 101, 102, 103, 104, 107, 108], "moon": 90, "greater": [90, 92, 93, 94, 95, 99, 104, 105, 107, 111, 139], "awak": 90, "group": [90, 123], "come": [90, 98, 99, 100, 101, 102, 103, 104, 107, 108], "sleep": 90, "littl": [90, 102, 130], "cpu": [90, 136], "wake": 90, "attach": [90, 93, 96, 98, 108], "graviti": [90, 93, 94, 96, 103, 104, 136, 141], "enable_wind": [90, 136], "wind_pow": [90, 122, 136], "turbulence_pow": [90, 136], "later": [90, 136, 139, 141], "booster": 90, "gravit": 90, "wind": [90, 122], "tanh": [90, 141], "sin": [90, 96, 103, 106], "pi": [90, 92, 96], "9999": 90, "rotat": [90, 92, 98, 101, 102, 105, 125, 139], "turbul": [90, 122], "renorm": 90, "harder": 90, "push": [90, 93, 103, 104, 109, 141], "cart": [91, 103, 104, 141], "nois": [91, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108], "regard": 91, "underpow": 91, "effort": [91, 130], "easier": [91, 118, 126, 136], "ones": [91, 97, 118, 136, 139], "57": [92, 136], "spars": [92, 132], "coars": 92, "barto": [92, 93, 103, 104, 111, 112, 117, 139], "book": [92, 111, 112, 117, 139], "link": [92, 98, 99, 100, 101, 102, 106, 107, 130], "actuat": [92, 93, 101, 102], "swing": [92, 96], "free": [92, 96, 97, 98, 101, 102, 103, 104, 109, 139, 141], "height": [92, 100, 103, 108, 127], "hang": [92, 126], "downward": 92, "seen": [92, 99], "green": [92, 114], "cosin": [92, 103, 106], "theta1": 92, "sine": [92, 103, 106], "theta2": 92, "567": 92, "274": [92, 130], "rel": [92, 101, 102, 132, 134, 136], "4\u03c0": 92, "9\u03c0": 92, "rad": [92, 93, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108], "incur": [92, 112, 114], "co": [92, 94, 95, 96, 103, 106, 109], "book_or_nip": 92, "neurip": 92, "paper": [92, 103, 114], "nip": 92, "equat": [92, 96], "present": [92, 109, 124, 132, 133, 139], "confirm": [92, 118], "radian": [92, 93, 96, 104], "1996": 92, "touretzki": 92, "mozer": 92, "hasselmo": 92, "ed": 92, "vol": [92, 114], "mit": [92, 136, 139, 141], "proceed": 92, "cc": 92, "1995": 92, "8f1d43620bc6bb580df6e80b0dc05c48": 92, "pdf": [92, 111, 112], "anderson": [93, 103, 104], "neuronlik": [93, 103, 104], "adapt": [93, 103, 104, 112], "un": 93, "frictionless": 93, "balanc": [93, 103, 104, 136, 141], "vari": [93, 103, 104, 141], "418": 93, "untermin": 93, "2095": 93, "allot": 93, "475": 93, "05": [93, 98, 99, 105, 130], "07": [94, 95], "sinusoid": [94, 95], "vallei": [94, 95], "strateg": [94, 95], "hill": [94, 95], "andrew": [94, 95], "moor": [94, 95], "phd": [94, 95, 107], "thesi": [94, 95, 107], "1990": [94, 95], "techreport": [94, 95], "moore90efficientmemori": [94, 95], "author": [94, 95, 109, 136, 139, 141], "william": [94, 95, 141], "institut": [94, 95], "univers": [94, 95], "cambridg": [94, 95], "year": [94, 95, 124], "001": [94, 96, 100, 103, 108, 136, 139], "0025": [94, 95], "collis": [94, 95, 126], "inelast": [94, 95], "upon": [94, 95], "quickli": [94, 139], "penalis": [94, 95, 98, 99, 100, 101, 102, 103, 105, 106, 107, 108], "0015": 95, "45": [95, 102, 105], "999": [95, 136], "invert": [96, 97, 141], "swingup": 96, "diagram": 96, "meter": 96, "theta": [96, 128], "tau": 96, "counter": 96, "clockwis": 96, "theta_dt": 96, "heta": 96, "2736044": 96, "math": [96, 123], "half": 97, "cheetah": 97, "standup": 97, "facilit": [97, 109], "biomechan": 97, "graphic": [97, 109, 119], "anim": 97, "area": 97, "accur": 97, "octob": 97, "2021": [97, 109], "deepmind": [97, 122], "2022": [97, 124, 130], "everyon": 97, "instruct": [97, 132], "websit": [97, 109, 118, 119, 127, 130], "github": [97, 112, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 126, 127, 128, 129, 130, 132], "framework": 97, "ten": [97, 111, 139], "iverteddoublependulum": 97, "gaussian": 97, "mjsim": 97, "qpo": 97, "qvel": [97, 101, 102], "indirectli": 97, "xml": [97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 123, 130], "tweak": [97, 107], "schulman": [98, 136], "moritz": [98, 136], "levin": [98, 136], "jordan": [98, 136], "abbeel": [98, 136], "advantag": [98, 109, 132], "estim": [98, 133, 136, 141], "torso": [98, 99, 100, 101, 102, 108], "eight": 98, "hing": [98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108], "rotor": [98, 99, 100, 101, 102, 107, 108], "hip_4": 98, "right_back_leg": 98, "angle_4": 98, "front": [98, 99, 107], "hip_1": 98, "front_left_leg": 98, "angle_1": 98, "hip_2": 98, "front_right_leg": 98, "angle_2": 98, "hip_3": 98, "back_leg": 98, "angle_3": 98, "deriv": [98, 99, 100, 101, 102, 103, 104, 107, 108, 141], "exclude_current_positions_from_observ": [98, 99, 100, 101, 107, 108], "29": [98, 101, 102], "regardless": [98, 99, 100, 101, 107, 108], "x_posit": [98, 99, 100, 101, 107, 108], "y_posit": [98, 101, 107], "z": [98, 99, 100, 101, 102, 105, 106, 108], "centr": [98, 101, 102], "ankle_1": 98, "ankle_2": 98, "ankle_3": 98, "ankle_4": 98, "19": [98, 101, 102, 105, 117, 130, 136], "23": [98, 101, 102, 105, 109, 122, 130], "use_contact_forc": [98, 130], "translat": [98, 101, 102, 130, 132], "dof": [98, 101, 102], "quaternion": [98, 101, 102], "healthy_reward": [98, 100, 101, 108], "healthi": [98, 100, 101, 108], "forward_reward": [98, 99, 100, 101, 107, 108], "dt": [98, 99, 100, 101, 105, 106, 107, 108], "frametim": [98, 99, 100, 101, 107, 108], "ctrl_cost": [98, 99, 100, 101, 107, 108], "too": [98, 99, 100, 101, 102, 103, 105, 106, 107, 108], "ctrl_cost_weight": [98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108], "ctr_cost_weight": 98, "contact_cost": [98, 101], "contact_cost_weight": [98, 101], "contact_force_rang": 98, "reset_noise_scal": [98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108], "deviat": [98, 99, 103, 107, 136, 141], "intention": [98, 101, 102], "therebi": [98, 101, 102], "unhealthi": [98, 100, 101, 108], "healthy_z_rang": [98, 100, 101, 108], "terminate_when_unhealthi": [98, 100, 101, 108], "xml_file": [98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108], "path": [98, 99, 100, 101, 105, 106, 107, 108, 113, 136], "model": [98, 99, 100, 101, 107, 108, 109, 130, 139], "weight": [98, 99, 100, 101, 105, 106, 107, 108, 109, 127, 133, 134, 141], "5e": [98, 100, 101, 108], "perturb": [98, 99, 100, 101, 107, 108], "induct": [98, 99, 100, 101, 107, 108], "bia": [98, 99, 100, 101, 107, 108, 136], "induc": [98, 99, 100, 101, 107, 108], "agnost": [98, 99, 100, 101, 102, 107, 108], "bind": [98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 122], "restor": 98, "camera": [98, 99, 100, 101, 102, 103, 104, 107, 108], "max_time_step": [98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108], "p": [99, 109, 112, 113, 114, 136], "wawrzy\u0144ski": 99, "cat": 99, "paw": 99, "alloc": 99, "thigh": [99, 100, 101, 102, 108], "shin": [99, 101, 102], "feet": [99, 108], "bthigh": 99, "bshin": 99, "bfoot": 99, "fthigh": 99, "fshin": 99, "ffoot": 99, "tip": [99, 103, 107], "rootz": [99, 100, 108], "slide": [99, 100, 103, 104, 105, 106, 107, 108], "rooti": [99, 100, 108], "rootx": [99, 100, 108], "forward_reward_weight": [99, 100, 101, 107, 108], "half_cheetah": 99, "erez": [100, 101, 102, 108], "tassa": [100, 101, 102, 108], "todorov": [100, 101, 102, 108], "predict": [100, 108, 136, 141], "nonlinear": [100, 108], "compar": [100, 107, 108, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 126, 127, 128, 129, 136, 139], "figur": [100, 108, 139, 141], "middl": [100, 108], "thigh_joint": [100, 108], "leg_joint": [100, 108], "foot_joint": [100, 108], "008": [100, 108], "els": [100, 108, 113, 132, 136, 139], "healthy_state_rang": 100, "fallen": 100, "healthy_angle_rang": [100, 108], "376": [101, 102], "synthesi": [101, 102], "onlin": [101, 102, 109, 111, 112], "abdomen": [101, 102], "pair": [101, 102], "arm": [101, 102, 105, 106, 109], "elbow": [101, 102, 105], "walk": [101, 108, 110, 113, 132], "abdomen_i": [101, 102], "abdomen_z": [101, 102], "abdomen_x": [101, 102], "right_hip_x": [101, 102], "right_thigh": [101, 102], "right_hip_z": [101, 102], "right_hip_i": [101, 102], "right_kne": [101, 102], "left_hip_x": [101, 102], "left_thigh": [101, 102], "left_hip_z": [101, 102], "left_hip_i": [101, 102], "left_kne": [101, 102], "right_shoulder1": [101, 102], "right_shoulder2": [101, 102], "right_elbow": [101, 102], "left_shoulder1": [101, 102], "left_shoulder2": [101, 102], "left_elbow": [101, 102], "378": 101, "root": [101, 102, 130], "lower_waist": [101, 102], "pelvi": [101, 102], "right_upper_arm": [101, 102], "right_lower_arm": [101, 102], "left_upper_arm": [101, 102], "left_lower_arm": [101, 102], "anglular": [101, 102, 104], "aanglular": [101, 102], "33": [101, 102], "34": 101, "35": [101, 102, 130], "37": [101, 102, 130], "39": [101, 102, 130], "41": [101, 102, 130], "43": [101, 102], "velocitti": 101, "cinert": [101, 102], "inertia": [101, 102], "rigid": [101, 102], "intermedi": [101, 102], "nbodi": [101, 102], "henc": [101, 102, 110, 141], "140": [101, 102], "cvel": [101, 102], "qfrc_actuat": [101, 102], "constraint": [101, 102, 103, 109], "nv": [101, 102], "cfrc_ext": [101, 102], "freedom": [101, 102, 103, 134], "dim": [101, 102], "003": 101, "015": 101, "nu": [101, 102], "contact_cost_rang": 101, "lai": 102, "numer": [102, 103, 104, 111, 116, 130, 134, 141], "state_spac": 102, "uph_cost": 102, "upward": 102, "absolut": [102, 104, 108], "overal": 102, "atom": 102, "movement": [102, 132], "though": [102, 117, 119], "inflat": 102, "quad_ctrl_cost": 102, "quad_impact_cost": 102, "000001": 102, "105": [102, 130], "unlik": [102, 103, 104, 105, 106, 141], "beyond": [102, 103, 104, 105, 106, 108, 130], "slider": [103, 104], "unitless": [103, 106], "hinge2": 103, "realist": [103, 109], "accuraci": 103, "approach": [103, 117, 132, 139, 141], "analyt": 103, "alive_bonu": 103, "distance_penalti": 103, "velocity_penalti": 103, "005": [103, 105, 106, 136], "y_coordin": 103, "196": 103, "perpendicularli": 103, "cylind": 105, "effector": [105, 106], "fingertip": [105, 106], "shoulder": 105, "forearm": 105, "wrist": 105, "pan": 105, "r_shoulder_pan_joint": 105, "lift": 105, "r_shoulder_lift_joint": 105, "r_upper_arm_roll_joint": 105, "flex": 105, "r_elbow_flex_joint": 105, "r_forearm_roll_joint": 105, "r_wrist_flex_joint": 105, "r_wrist_roll_joint": 105, "analogi": 105, "tips_arm": 105, "obj_slidex": 105, "obj_slidei": 105, "goal_slidex": 105, "goal_slidei": 105, "sphere": 105, "reward_near": 105, "unattach": [105, 106], "reward_dist": [105, 106, 134], "reward_control": [105, 106], "euclidean": [105, 106], "reward_ctrl": [105, 106, 134], "perman": 105, "323": 105, "rise": 105, "modif": [105, 106, 134], "asset": [105, 106, 109, 113], "gymnasmium": 105, "fixtur": 106, "joint0": 106, "joint1": 106, "target_x": 106, "target_i": 106, "position_fingertip": 106, "position_target": 106, "na": 106, "constantli": 106, "2d": [106, 134], "disk": 106, "radiu": 106, "everyth": 106, "02": 106, "r\u00e9mi": 107, "coulom": 107, "applic": [107, 109], "segment": 107, "articul": [107, 109], "suspend": 107, "subject": 107, "fluid": 107, "viscou": 107, "coeffici": [107, 136], "motor1_rot": 107, "motor2_rot": 107, "\u03b8": 107, "free_body_rot": 107, "slider1": 107, "slider2": 107, "04": 107, "swim": 107, "split": [108, 130], "thigh_left_joint": 108, "leg_left_joint": 108, "foot_left_joint": 108, "ctr_cost": 108, "procedur": [109, 141], "clone": [109, 132], "huge": [109, 119, 127], "3v3": 109, "hundr": 109, "roughli": 109, "tweakabl": 109, "monei": 109, "slime": 109, "volleybal": 109, "motiv": 109, "premad": 109, "foss": 109, "interoper": 109, "extens": [109, 141], "light": 109, "poli": 109, "pinocchio": 109, "meshcat": 109, "web": 109, "bitcraz": 109, "crazyfli": 109, "nanoquadrotor": 109, "endeavor": 109, "gap": 109, "deep": [109, 124, 133, 136, 141], "methodologi": 109, "coverag": 109, "laboratori": 109, "internet": 109, "quadrotor": 109, "casadi": 109, "symbol": 109, "priori": 109, "isaac": 109, "omnivers": 109, "cours": 109, "wide": 109, "account": [109, 126], "yield": 109, "voltag": 109, "duti": 109, "cycl": 109, "emphasi": 109, "percept": 109, "social": 109, "driver": 109, "whose": [109, 111], "uncertain": 109, "merg": [109, 130], "intersect": 109, "roundabout": 109, "latent": 109, "transfer": 109, "miniatur": 109, "racecar": 109, "llvm": 109, "phase": [109, 136], "gcc": 109, "cuda": [109, 136], "p_0": 109, "morl": 109, "cell": [109, 112, 132], "warehous": 109, "storag": 109, "overfit": [109, 136], "predefin": [109, 132], "hyperparamet": [109, 136, 139, 141], "cheap": 109, "surrog": 109, "evolutionari": 109, "tag": [109, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 126, 127, 128, 129], "answer": 109, "classif": 109, "dataset": 109, "autom": [109, 118], "prover": 109, "vampir": 109, "theoret": [109, 124], "workshop": 109, "minatari": 109, "bsuit": 109, "great": [109, 134, 139], "focu": [109, 136], "simplic": 109, "comprehens": [109, 119], "crypto": 109, "omg": 109, "toolbox": 109, "minimalist": 109, "synthes": 109, "neuro": 109, "architectur": 109, "integr": 109, "twin": 109, "concept": 109, "seamless": 109, "firmwar": 109, "neuroflight": 109, "frozen": [110, 119, 130], "lake": [110, 119, 130], "suitabl": 110, "card": [111, 139], "dealer": [111, 124, 139], "deck": [111, 139], "jack": 111, "queen": 111, "king": 111, "ac": [111, 139], "usabl": [111, 119, 139], "held": 111, "decid": 111, "bust": [111, 139], "reveal": 111, "facedown": 111, "goe": [111, 127], "outcom": 111, "hand": [111, 141], "sab": [111, 139], "2020": [111, 112], "incompleteidea": [111, 112], "rlbook2020": [111, 112], "48": 112, "4x12": 112, "world": [112, 113, 114], "132": [112, 130], "inspir": 112, "com": [112, 113, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 126, 127, 128, 129, 132, 141], "dennybritz": 112, "blob": [112, 118], "cliff_walk": 112, "latter": 112, "current_row": [112, 113], "nrow": [112, 113, 136], "current_col": [112, 113], "col": [112, 113], "47": 112, "proabil": [112, 114], "slipperi": 113, "extent": 113, "4x4": 113, "perpendicular": 113, "sometim": [113, 132, 134], "is_slipperi": 113, "stool": 113, "franuka": 113, "itch": 113, "io": 113, "rpg": 113, "snow": 113, "tileset": 113, "mel": 113, "tilleri": 113, "cyaneu": 113, "ncol": [113, 136, 139], "time_limit": [113, 114], "8x8": 113, "desc": 113, "map_nam": 113, "preload": 113, "sfff": 113, "fhfh": 113, "fffh": 113, "hffg": 113, "generate_random_map": 113, "toy_text": [113, 116, 119, 127, 139], "frozen_lak": 113, "sfffffff": 113, "ffffffff": 113, "fffhffff": 113, "fffffhff": 113, "fhhfffhf": 113, "fhffhfhf": 113, "fffhfffg": 113, "bug": [113, 119, 120, 121, 122, 130], "passeng": 114, "yellow": 114, "5x5": 114, "maxq": 114, "decomposit": 114, "tom": 114, "dietterich": 114, "pickup": 114, "south": 114, "north": 114, "east": 114, "west": 114, "letter": [114, 122], "taxi_row": 114, "taxi_col": 114, "passenger_loc": 114, "actual": [114, 132, 136], "404": 114, "reachabl": 114, "illeg": 114, "action_mask": 114, "fickl": 114, "Or": 114, "argmax": [114, 139], "q_valu": [114, 139], "pp": 114, "227": 114, "303": 114, "nov": 114, "doi": 114, "1613": 114, "639": 114, "cleaner": 114, "disallow": 114, "loc": [114, 136], "passidx": 114, "maintain": [115, 116, 130], "capabl": [115, 127], "insert": [115, 141], "mainten": [116, 127], "jkterry1": [116, 117], "becam": 116, "datatyp": 116, "orsini": 116, "complianc": 116, "sb3": 116, "amtamasi": 116, "recordepisodestat": 116, "vwxyzjn": [116, 117, 119, 120, 121], "unus": [116, 117, 120], "unnescesari": 116, "newer": 116, "machin": [116, 127, 141], "notabl": [116, 130, 133], "peg": 116, "pend": 116, "bump": [116, 117, 118, 119, 122, 124, 127], "zhiqingxiao": [116, 121, 125], "depreci": 116, "pirata": 116, "mahiuchun": 116, "zlig": [116, 118], "ez": 116, "pickl": [116, 126, 129, 130], "zzyunzhi": 116, "jamesborg46": 116, "minor": [116, 117, 118, 120, 124, 126, 128, 129, 130], "nonbreak": 116, "bit": 116, "typo": [116, 128, 129, 130], "mostli": 116, "cclauss": 116, "readm": [116, 119, 128, 130, 132], "third": [116, 117, 118, 130, 132], "parti": [116, 117, 118, 130, 132], "flake8": 116, "changelog": [116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 126, 127, 128, 129, 130], "massiv": [117, 124], "explain": [117, 124, 127], "jessefarebro": [117, 118, 119], "rom": [117, 118], "bash": 117, "autorom": [117, 118], "pip3": 117, "guess": 117, "hotter": 117, "colder": 117, "nchain": 117, "roulett": 117, "kellycoinflip": 117, "rohan138": [117, 118, 119], "tristandeleu": [117, 118, 119, 120], "__setitem__": 117, "jfpettit": 117, "firefoxmetzg": 117, "compli": 117, "redtachyon": [117, 118, 119, 120, 122, 123, 124, 126, 127, 130], "__getitem__": 117, "__len__": 117, "xuehaipan": [117, 118, 119, 126, 130], "gracefulli": 117, "unnecessari": [117, 122], "setup": [117, 123, 132], "resolv": 117, "tuckerbmorgan": 117, "sent": 117, "olimoyo": 117, "registr": [117, 119, 123, 132], "obswrapp": 117, "behav": 117, "raghuspacerajan": 117, "perf_count": 117, "short": 117, "zuoxingdong": 117, "broken": 118, "plugin": [118, 130], "clobber": 118, "hook": [118, 130], "suit": 118, "shorthand": 118, "accident": [118, 122, 124], "refactor": [118, 119, 130], "orderli": 118, "helper": 118, "ahmedo42": 118, "stderr": 118, "compil": 118, "submit": 118, "third_party_environ": 118, "largest": 119, "2524": 119, "site": 119, "gymlibrari": [119, 127], "ml": 119, "curriculum": 119, "reiniti": [119, 141], "expens": 119, "suggest": [119, 136], "kir0ul": [119, 126, 130], "terminal_observ": 119, "nice": 119, "1b15": [119, 125], "seungjaeryanle": 119, "2456": 119, "comment": [119, 122, 130], "consolid": 119, "andrewtanj": [119, 120, 121, 122], "carloslui": 119, "araffin": [119, 124], "pyglet": 119, "frequent": [119, 133], "discreteenv": 119, "hint": [119, 124, 127, 130], "ikamensh": [119, 128, 130], "ton": 119, "cleanup": 119, "markus28": [119, 120, 122, 124, 130], "rushivarora": [119, 120, 121], "jjshoot": [119, 122, 124, 130], "ericonaldo": 119, "adilzouitin": 119, "dramat": 119, "pull": 119, "randomst": 119, "rand": [119, 127], "standard_norm": 119, "consequ": 119, "mt19937": 119, "pcg64": 119, "ahead": 120, "trigaten": 120, "gianlucadecola": [120, 122, 123, 130], "striker": [120, 121], "thrower": [120, 121], "archiv": 120, "rusu24edward": [120, 130], "dsctt": 120, "duburcqa": 120, "videorecord": [121, 130], "2678": 121, "2684": 121, "package_data": 121, "micim": 121, "2683": 121, "1500": 121, "pseudo": [121, 122, 123, 124, 125, 126, 127, 129, 130, 136], "rnd": [121, 122, 123, 124, 125, 126, 127, 129, 130], "thought": [121, 122, 123, 124, 125, 126, 127, 129, 130], "curv": 122, "significantli": [122, 136], "wors": 122, "rodrigodelazcano": [122, 123, 130], "arjun": [122, 124, 126, 127], "kg": [122, 124, 126, 127], "virgilt": 122, "ascii": 122, "googl": 122, "pydoc": 122, "balisujohn": [122, 124, 127, 130], "polygon": 122, "vecenvwrapp": 122, "backend": 122, "backport": 122, "v24": 123, "mujoco_rend": 123, "redund": 123, "quagla": 123, "unpickl": 123, "legaci": 123, "meta": 123, "rescale_act": 123, "subsequ": 124, "smoother": [124, 139], "discourag": 124, "put": [124, 132], "discord": [124, 130], "youni": 124, "2671": 124, "single_rgb_arrai": [124, 127], "2906": 124, "ryanrud": 124, "revert": [124, 125, 127, 130], "kexianshen": 124, "whole": [124, 130], "pyright": 124, "hinter": 124, "strict": [124, 130], "identifi": 124, "psc": [124, 125], "textencod": 124, "johnminelli": 124, "dockerfil": 124, "optimis": 124, "2gb": 124, "5gb": 124, "theden": 124, "younik": [125, 127, 128, 129, 130], "vmoen": [125, 128, 130], "edit": [125, 132], "rephras": 125, "evanmath": 125, "ice1187": 125, "humanoidstandup_v4": 125, "mujoco_env": 125, "vector_list_info": 125, "timgates42": 125, "lin826": [125, 127], "fairli": [126, 141], "_timelimit": 126, "envpool": 126, "__eq__": 126, "8gb": 126, "subse": 126, "olipinski": [126, 130], "metaclass": 126, "youjiacheng": [126, 127, 128], "swig": 126, "annot": [126, 130, 136, 139, 141], "bkrl": 126, "aren": 127, "semant": 127, "terribli": 127, "wrong": 127, "patch": [127, 139], "ve": 127, "stabl": [127, 132], "tremend": 127, "appreci": 127, "patienc": 127, "gone": 127, "hopefulli": [127, 139], "v21": [127, 130], "3040": 127, "3016": 127, "get_stat": 127, "set_stat": 127, "hash_se": 127, "create_se": 127, "_bigint_from_byt": 127, "_int_list_from_bigint": 127, "envapicompat": 127, "3041": 127, "fieteo": 127, "offscreen": [127, 130], "3044": 127, "headless": 127, "3037": 127, "renam": [127, 141], "3036": 127, "3072": 128, "3076": 128, "3080": 128, "foxik": 128, "3083": 128, "rdnfn": 128, "vermouth1992": [129, 130], "harden": [129, 130], "permiss": [129, 130], "sashashura": [129, 130], "clarifi": [129, 130], "ekalosak": [129, 130], "2023": 130, "pypi": 130, "bool8": 130, "bool_": 130, "221": 130, "272": 130, "silent": 130, "ianyfan": 130, "230": 130, "254": 130, "assert": [130, 132], "215": 130, "216": 130, "prompt": 130, "252": 130, "259": 130, "rafaelcp": 130, "277": 130, "gt": 130, "5x": 130, "paulmest": 130, "235": 130, "nidhish": 130, "238": 130, "241": 130, "225": 130, "mgoulao": 130, "257": 130, "246": 130, "explicit": 130, "fail": 130, "pierremardon": 130, "267": 130, "doctest": 130, "valentin": 130, "cnt": 130, "a2c": [130, 135, 137], "till2": 130, "234": 130, "kallinteri": 130, "andrea": 130, "206": 130, "218": 130, "219": 130, "mention": [130, 141], "migrat": 130, "lpizzinidev": 130, "244": 130, "hooper": 130, "247": 130, "convolv": [130, 136, 139], "264": 130, "270": 130, "258": 130, "thank": 130, "contributor": 130, "server": 130, "qualiti": 130, "backlog": 130, "mujocorend": 130, "roadmap": 130, "publicli": 130, "overhaul": 130, "feedback": 130, "interest": 130, "act": [130, 134, 139], "compartment": 130, "funcjaxenv": 130, "potenti": 130, "mechan": 130, "thread": 130, "opengl": 130, "mujocorender": 130, "112": 130, "apply_env_compat": 130, "gymv22environ": 130, "125": 130, "pretti": 130, "print": [130, 132, 134, 136, 141], "kad99kev": 130, "124": 130, "141": 130, "72": 130, "190": 130, "siddarth": [130, 141], "155": 130, "theo": 130, "brown": 130, "74": 130, "mujocoenv": 130, "83": 130, "tobirohr": 130, "89": 130, "117": 130, "thytu": 130, "__all__": 130, "130": 130, "is_slippi": 130, "marionj": 130, "136": 130, "143": 130, "172": 130, "173": 130, "174": 130, "139": 130, "164": 130, "axb2035": 130, "171": 130, "step_wait": 130, "aaronwalsman": 130, "178": 130, "183": 130, "cool": 130, "rr": 130, "184": 130, "186": 130, "208": 130, "codebas": [130, 132], "205": 130, "73": 130, "78": 130, "workflow": 130, "110": 130, "138": 130, "146": 130, "rerun": 130, "commit": 130, "179": 130, "yet": 130, "meantim": 130, "61": 130, "episodestatisticsrecord": 130, "davidslayback": 130, "overflow": 130, "55": 130, "vairodp": 130, "willdudlei": 130, "51": 130, "58": 130, "upstream": 130, "09": 130, "conduct": 130, "overview": [132, 141], "virtual": 132, "git": 132, "venv": 132, "bin": 132, "concern": [132, 141], "gym_exampl": 132, "grid_world": 132, "relative_posit": 132, "reacher_weighted_reward": 132, "discrete_act": 132, "clip_reward": 132, "illustr": [132, 133], "simplist": 132, "gridworldenv": 132, "piec": 132, "abstract": 132, "window_s": 132, "512": 132, "_action_to_direct": 132, "clock": 132, "_get_ob": 132, "mandatori": 132, "_agent_loc": 132, "_target_loc": 132, "manhattan": 132, "_get_info": 132, "oftentim": 132, "worri": 132, "coincid": 132, "earlier": 132, "array_equ": 132, "_render_fram": 132, "trivial": 132, "skeleton": 132, "set_mod": 132, "canva": 132, "pix_square_s": 132, "rect": 132, "gridlin": 132, "width": 132, "visibl": 132, "blit": 132, "get_rect": 132, "pump": 132, "tick": 132, "surfarrai": 132, "pixels3d": 132, "bother": 132, "detect": 132, "appropri": [132, 141], "entrypoint": 132, "mere": 132, "setuptool": 132, "install_requir": 132, "local": 132, "perfectli": 132, "fine": [132, 136], "relativeposit": [132, 134], "ipynb": [132, 133, 134, 136, 139, 141], "did": 133, "failur": 133, "inher": 133, "preserv": 133, "obviou": 133, "forev": 133, "forcibli": 133, "halt": 133, "idea": [133, 139], "tell": [133, 139], "formal": 133, "q_": 133, "o_t": 133, "a_t": 133, "r_t": 133, "max_a": 133, "o_": 133, "a_": [133, 136], "q_target": 133, "distinct": 133, "differenti": 133, "vf_target": 133, "vf_next_stat": 133, "onward": 133, "handling_time_limit": 133, "agent_posit": 134, "target_posit": 134, "discreteact": 134, "disc_to_cont": 134, "__name__": [134, 136], "__main__": 134, "intrins": 134, "clipreward": 134, "nevertheless": 134, "reacherrewardwrapp": 134, "reward_dist_weight": 134, "reward_ctrl_weight": 134, "implementing_custom_wrapp": 134, "a3c": 136, "quicker": 136, "robust": 136, "scratch": [136, 141], "feed": 136, "minibatch": 136, "n_steps_per_upd": 136, "n_env": 136, "gradient": [136, 141], "gae": 136, "tradeoff": 136, "logit": 136, "select_act": 136, "prob": [136, 141], "ent_coef": 136, "encourag": 136, "get_loss": 136, "update_paramet": 136, "zemann": [136, 139], "__future__": [136, 139, 141], "o": [136, 141], "pyplot": [136, 139, 141], "plt": [136, 139, 141], "nn": [136, 141], "tqdm": [136, 139], "maxim": [136, 141], "arg": [136, 139, 141], "n_featur": 136, "n_action": 136, "gpu": 136, "larger": 136, "critic_lr": 136, "actor_lr": 136, "critic_lay": 136, "relu": 136, "actor_lay": 136, "fed": 136, "softmax": 136, "sequenti": [136, 141], "critic_optim": 136, "rmsprop": 136, "lr": [136, 139, 141], "actor_optim": 136, "state_valu": [136, 139], "action_logits_vec": 136, "action_log_prob": 136, "action_logit": 136, "action_pd": 136, "implicitli": 136, "log_prob": [136, 141], "value_pr": 136, "lam": 136, "arxiv": 136, "1506": 136, "02438": 136, "mont": [136, 139, 141], "carlo": [136, 139, 141], "td": 136, "bias": 136, "critic_loss": 136, "actor_loss": 136, "td_error": 136, "pow": 136, "detach": 136, "zero_grad": [136, 141], "epoch": 136, "speedup": 136, "theirfor": 136, "simplest": 136, "parameter": [136, 141], "a_min": 136, "a_max": 136, "proport": 136, "mitig": 136, "remak": 136, "hyperparam": 136, "n_updat": 136, "randomize_domain": 136, "95": [136, 139], "stationari": 136, "obs_shap": 136, "action_shap": 136, "use_cuda": 136, "is_avail": 136, "notic": 136, "envs_wrapp": 136, "bar": 136, "sample_phas": 136, "ep_value_pr": 136, "ep_reward": 136, "ep_action_log_prob": 136, "s_": 136, "state_value_pr": 136, "r_": 136, "squeez": 136, "ongo": 136, "inlin": 136, "rolling_length": [136, 139], "fig": [136, 139], "subplot": [136, 139], "figsiz": [136, 139, 141], "suptitl": [136, 139], "__class__": 136, "set_titl": [136, 139], "episode_returns_moving_averag": 136, "arang": [136, 139], "set_xlabel": [136, 139], "entropy_moving_averag": 136, "critic_losses_moving_averag": 136, "actor_losses_moving_averag": 136, "tight_layout": [136, 139], "karp": 136, "flatt": 136, "120": 136, "enough": 136, "runtim": 136, "save_weight": 136, "load_weight": 136, "actor_weights_path": 136, "actor_weight": 136, "h5": 136, "critic_weights_path": 136, "critic_weight": 136, "mkdir": 136, "state_dict": 136, "load_state_dict": 136, "eval": 136, "n_showcase_episod": 136, "no_grad": 136, "mnih": 136, "badia": 136, "mirza": 136, "grave": 136, "lillicrap": 136, "harlei": 136, "silver": 136, "kavukcuoglu": 136, "icml": 136, "2016": 136, "iclr": 136, "vector_envs_tutori": 136, "tutorials_python": 137, "zip": [137, 141], "tutorials_jupyt": 137, "casino": 139, "infam": 139, "beatabl": 139, "won": 139, "viabl": 139, "strategi": 139, "favorit": 139, "defaultdict": 139, "seaborn": [139, 141], "sn": [139, 141], "explanatori": 139, "slow": 139, "showcas": 139, "respond": 139, "harm": 139, "greedi": 139, "blackjackag": 139, "learning_r": [139, 141], "initial_epsilon": 139, "epsilon_decai": 139, "final_epsilon": 139, "discount_factor": 139, "decai": 139, "training_error": 139, "get_act": 139, "greedili": 139, "exploit": 139, "next_ob": [139, 141], "future_q_valu": 139, "temporal_differ": 139, "decay_epsilon": 139, "readi": 139, "n_episod": 139, "100_000": 139, "start_epsilon": 139, "decent": [139, 141], "converg": 139, "10x": 139, "reward_moving_averag": 139, "length_moving_averag": 139, "training_error_moving_averag": 139, "create_grid": 139, "usable_ac": 139, "action_valu": 139, "player_count": 139, "dealer_count": 139, "meshgrid": 139, "apply_along_axi": 139, "arr": 139, "dstack": 139, "value_grid": 139, "policy_grid": 139, "create_plot": 139, "figaspect": 139, "fontsiz": 139, "ax1": 139, "add_subplot": 139, "plot_surfac": 139, "rstride": 139, "cstride": 139, "cmap": 139, "viridi": 139, "edgecolor": 139, "xtick": 139, "ytick": 139, "set_ylabel": 139, "zaxi": 139, "set_rotate_label": 139, "set_zlabel": 139, "view_init": 139, "220": 139, "ax2": 139, "heatmap": 139, "linewidth": 139, "accent_r": 139, "cbar": 139, "set_xticklabel": 139, "set_yticklabel": 139, "legend": 139, "legend_el": 139, "facecolor": 139, "lightgreen": 139, "label": 139, "grei": 139, "bbox_to_anchor": 139, "fig1": 139, "fig2": 139, "grip": 139, "challeng": 139, "fun": [139, 141], "blackjack_tutori": 139, "earliest": 141, "burden": 141, "inverted_pendulum": 141, "1d": 141, "panda": 141, "pd": 141, "rcparam": 141, "policy_network": 141, "obs_space_dim": 141, "action_space_dim": 141, "hidden_space1": 141, "feel": 141, "hidden_space2": 141, "shared_net": 141, "policy_mean_net": 141, "std": 141, "policy_stddev_net": 141, "action_mean": 141, "action_stddev": 141, "shared_featur": 141, "exp": 141, "fact": 141, "reinfroc": 141, "acronym": 141, "ward": 141, "ncrement": 141, "actor": 141, "ffset": 141, "einforc": 141, "haracterist": 141, "ligibl": 141, "tune": 141, "ep": 141, "adamw": 141, "sample_act": 141, "distrib": 141, "running_g": 141, "delta": 141, "centric": 141, "brittl": 141, "spinningup": 141, "en": 141, "html": 141, "total_num_episod": 141, "5e3": 141, "rewards_over_se": 141, "fibonacci": 141, "manual_se": 141, "reward_over_episod": 141, "avg_reward": 141, "rewards_to_plot": 141, "df1": 141, "datafram": 141, "melt": 141, "inplac": 141, "darkgrid": 141, "talk": 141, "palett": 141, "rainbow": 141, "lineplot": 141, "chandrasekar": 141, "ronald": 141, "connectionist": 141, "2004": 141, "229": 141, "256": 141, "reinforce_invpend_gym_v26": 141}, "objects": {"": [[15, 0, 1, "", "action_space"], [15, 0, 1, "", "observation_space"], [15, 0, 1, "", "single_action_space"], [15, 0, 1, "", "single_observation_space"]], "gymnasium": [[17, 1, 1, "", "ActionWrapper"], [2, 1, 1, "", "Env"], [19, 1, 1, "", "ObservationWrapper"], [20, 1, 1, "", "RewardWrapper"], [16, 1, 1, "", "Wrapper"], [8, 3, 1, "", "make"], [8, 3, 1, "", "pprint_registry"], [8, 3, 1, "", "register"], [9, 5, 0, "-", "spaces"], [8, 3, 1, "", "spec"], [16, 5, 0, "-", "wrappers"]], "gymnasium.ActionWrapper": [[17, 2, 1, "", "action"]], "gymnasium.Env": [[2, 0, 1, "", "action_space"], [2, 3, 1, "", "close"], [2, 0, 1, "", "metadata"], [2, 4, 1, "", "np_random"], [2, 0, 1, "", "observation_space"], [2, 3, 1, "", "render"], [2, 0, 1, "", "render_mode"], [2, 3, 1, "", "reset"], [2, 0, 1, "", "reward_range"], [2, 0, 1, "", "spec"], [2, 3, 1, "", "step"], [2, 4, 1, "", "unwrapped"]], "gymnasium.ObservationWrapper": [[19, 2, 1, "", "observation"]], "gymnasium.RewardWrapper": [[20, 2, 1, "", "reward"]], "gymnasium.Wrapper": [[16, 4, 1, "", "action_space"], [16, 3, 1, "", "close"], [16, 4, 1, "", "metadata"], [16, 4, 1, "", "np_random"], [16, 4, 1, "", "observation_space"], [16, 3, 1, "", "reset"], [16, 4, 1, "", "reward_range"], [16, 4, 1, "", "spec"], [16, 3, 1, "", "step"], [16, 4, 1, "", "unwrapped"]], "gymnasium.experimental": [[4, 1, 1, "", "FuncEnv"]], "gymnasium.experimental.FuncEnv": [[4, 3, 1, "", "initial"], [4, 3, 1, "", "observation"], [4, 3, 1, "", "render_close"], [4, 3, 1, "", "render_image"], [4, 3, 1, "", "render_init"], [4, 3, 1, "", "reward"], [4, 3, 1, "", "state_info"], [4, 3, 1, "", "step_info"], [4, 3, 1, "", "terminal"], [4, 3, 1, "", "transform"], [4, 3, 1, "", "transition"]], "gymnasium.experimental.wrappers": [[7, 1, 1, "", "AtariPreprocessingV0"], [7, 1, 1, "", "AutoresetV0"], [7, 1, 1, "", "ClipActionV0"], [7, 1, 1, "", "ClipRewardV0"], [7, 1, 1, "", "DelayObservationV0"], [7, 1, 1, "", "DtypeObservationV0"], [7, 1, 1, "", "FilterObservationV0"], [7, 1, 1, "", "FlattenObservationV0"], [7, 1, 1, "", "FrameStackObservationV0"], [7, 1, 1, "", "GrayscaleObservationV0"], [7, 1, 1, "", "HumanRenderingV0"], [7, 1, 1, "", "JaxToNumpyV0"], [7, 1, 1, "", "JaxToTorchV0"], [7, 1, 1, "", "LambdaActionV0"], [7, 1, 1, "", "LambdaObservationV0"], [7, 1, 1, "", "LambdaRewardV0"], [7, 1, 1, "", "NormalizeObservationV0"], [7, 1, 1, "", "NormalizeRewardV0"], [7, 1, 1, "", "NumpyToTorchV0"], [7, 1, 1, "", "OrderEnforcingV0"], [7, 1, 1, "", "PassiveEnvCheckerV0"], [7, 1, 1, "", "PixelObservationV0"], [7, 1, 1, "", "RecordEpisodeStatisticsV0"], [7, 1, 1, "", "RecordVideoV0"], [7, 1, 1, "", "RenderCollectionV0"], [7, 1, 1, "", "RescaleActionV0"], [7, 1, 1, "", "RescaleObservationV0"], [7, 1, 1, "", "ReshapeObservationV0"], [7, 1, 1, "", "ResizeObservationV0"], [7, 1, 1, "", "StickyActionV0"], [7, 1, 1, "", "TimeAwareObservationV0"]], "gymnasium.spaces": [[11, 1, 1, "", "Box"], [10, 1, 1, "", "Dict"], [11, 1, 1, "", "Discrete"], [10, 1, 1, "", "Graph"], [11, 1, 1, "", "MultiBinary"], [11, 1, 1, "", "MultiDiscrete"], [10, 1, 1, "", "Sequence"], [9, 1, 1, "", "Space"], [11, 1, 1, "", "Text"], [10, 1, 1, "", "Tuple"]], "gymnasium.spaces.Box": [[11, 2, 1, "", "is_bounded"], [11, 2, 1, "", "sample"], [11, 2, 1, "", "seed"]], "gymnasium.spaces.Dict": [[10, 2, 1, "", "sample"], [10, 2, 1, "", "seed"]], "gymnasium.spaces.Discrete": [[11, 2, 1, "", "sample"], [11, 2, 1, "", "seed"]], "gymnasium.spaces.Graph": [[10, 2, 1, "", "sample"], [10, 2, 1, "", "seed"]], "gymnasium.spaces.MultiBinary": [[11, 2, 1, "", "sample"], [11, 2, 1, "", "seed"]], "gymnasium.spaces.MultiDiscrete": [[11, 2, 1, "", "sample"], [11, 2, 1, "", "seed"]], "gymnasium.spaces.Sequence": [[10, 2, 1, "", "sample"], [10, 2, 1, "", "seed"]], "gymnasium.spaces.Space": [[9, 4, 1, "", "dtype"]], "gymnasium.spaces.Text": [[11, 2, 1, "", "sample"], [11, 2, 1, "", "seed"]], "gymnasium.spaces.Tuple": [[10, 2, 1, "", "sample"], [10, 2, 1, "", "seed"]], "gymnasium.spaces.space.Space": [[9, 3, 1, "", "contains"], [9, 3, 1, "", "from_jsonable"], [9, 4, 1, "", "is_np_flattenable"], [9, 3, 1, "", "sample"], [9, 3, 1, "", "seed"], [9, 4, 1, "", "shape"], [9, 3, 1, "", "to_jsonable"]], "gymnasium.spaces.utils": [[12, 3, 1, "", "flatdim"], [12, 3, 1, "", "flatten"], [12, 3, 1, "", "flatten_space"], [12, 3, 1, "", "unflatten"]], "gymnasium.utils.env_checker": [[14, 3, 1, "", "check_env"]], "gymnasium.utils.play": [[14, 1, 1, "", "PlayPlot"], [14, 1, 1, "", "PlayableGame"], [14, 3, 1, "", "play"]], "gymnasium.utils.play.PlayPlot": [[14, 2, 1, "", "callback"]], "gymnasium.utils.play.PlayableGame": [[14, 2, 1, "", "process_event"]], "gymnasium.utils.save_video": [[14, 3, 1, "", "capped_cubic_video_schedule"], [14, 3, 1, "", "save_video"]], "gymnasium.utils.seeding": [[14, 3, 1, "", "np_random"]], "gymnasium.utils.step_api_compatibility": [[14, 3, 1, "", "convert_to_done_step_api"], [14, 3, 1, "", "convert_to_terminated_truncated_step_api"], [14, 3, 1, "", "step_api_compatibility"]], "gymnasium.vector": [[15, 1, 1, "", "AsyncVectorEnv"], [15, 1, 1, "", "SyncVectorEnv"], [15, 1, 1, "", "VectorEnv"], [15, 3, 1, "", "make"]], "gymnasium.vector.VectorEnv": [[15, 2, 1, "", "close"], [15, 2, 1, "", "reset"], [15, 2, 1, "", "step"]], "gymnasium.vector.utils": [[13, 3, 1, "", "batch_space"], [13, 3, 1, "", "concatenate"], [13, 3, 1, "", "create_empty_array"], [13, 3, 1, "", "create_shared_memory"], [13, 3, 1, "", "iterate"], [13, 3, 1, "", "read_from_shared_memory"], [13, 3, 1, "", "write_to_shared_memory"]], "gymnasium.wrappers": [[18, 1, 1, "", "AtariPreprocessing"], [18, 1, 1, "", "AutoResetWrapper"], [17, 1, 1, "", "ClipAction"], [18, 1, 1, "", "EnvCompatibility"], [19, 1, 1, "", "FilterObservation"], [19, 1, 1, "", "FlattenObservation"], [19, 1, 1, "", "FrameStack"], [19, 1, 1, "", "GrayScaleObservation"], [18, 1, 1, "", "HumanRendering"], [19, 1, 1, "", "NormalizeObservation"], [20, 1, 1, "", "NormalizeReward"], [18, 1, 1, "", "OrderEnforcing"], [18, 1, 1, "", "PassiveEnvChecker"], [19, 1, 1, "", "PixelObservationWrapper"], [18, 1, 1, "", "RecordEpisodeStatistics"], [18, 1, 1, "", "RecordVideo"], [18, 1, 1, "", "RenderCollection"], [17, 1, 1, "", "RescaleAction"], [19, 1, 1, "", "ResizeObservation"], [18, 1, 1, "", "StepAPICompatibility"], [19, 1, 1, "", "TimeAwareObservation"], [18, 1, 1, "", "TimeLimit"], [19, 1, 1, "", "TransformObservation"], [20, 1, 1, "", "TransformReward"], [18, 1, 1, "", "VectorListInfo"]], "gymnasium.wrappers.gymnasium.Wrapper": [[16, 0, 1, "", "env"]]}, "objtypes": {"0": "py:attribute", "1": "py:class", "2": "py:method", "3": "py:function", "4": "py:property", "5": "py:module"}, "objnames": {"0": ["py", "attribute", "Python attribute"], "1": ["py", "class", "Python class"], "2": ["py", "method", "Python method"], "3": ["py", "function", "Python function"], "4": ["py", "property", "Python property"], "5": ["py", "module", "Python module"]}, "titleterms": {"404": 0, "page": [0, 1], "Not": 0, "found": 0, "The": [0, 9], "request": 0, "could": 0, "gymnasium": [1, 2, 4, 5, 15, 16, 115, 131, 132, 134, 135, 137], "doc": 1, "instruct": 1, "modifi": [1, 21], "environ": [1, 2, 3, 4, 5, 6, 7, 8, 14, 15, 21, 22, 23, 109, 115, 119, 132, 136, 139], "edit": 1, "an": [1, 139, 141], "ad": 1, "new": [1, 14, 116, 117], "atari": [1, 24, 43], "env": [1, 2, 15, 109, 132, 136], "non": 1, "other": [1, 7, 109, 116, 119], "step": [1, 14, 22, 23, 132], "build": [1, 139, 141], "document": 1, "write": 1, "tutori": [1, 137], "method": [2, 9, 15, 16], "attribut": [2, 9, 15, 16], "addit": 2, "implement": [2, 134], "experiment": [3, 4, 5], "function": [3, 4], "wrapper": [3, 6, 7, 16, 17, 18, 19, 20, 23, 132, 134], "observ": [3, 6, 7, 19, 21, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 89, 90, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 112, 113, 114, 132, 139], "action": [3, 6, 7, 17, 21, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 89, 90, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 112, 113, 114, 139], "reward": [3, 6, 7, 20, 24, 27, 28, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 88, 89, 90, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 112, 113, 114], "common": [3, 6, 24], "render": [3, 7, 14, 23, 132], "data": [3, 7], "convers": [3, 7], "vector": [3, 5, 6, 9, 13, 15, 136], "funcenv": 4, "func2env": 4, "functionaljaxcompatibilityenv": 4, "vectorenv": [5, 15], "asyncvectorenv": 5, "syncvectorenv": 5, "custom": [5, 132, 134], "envpool": 5, "lambda": 6, "onli": 6, "registri": 8, "make": [8, 15, 132], "regist": [8, 132], "all": 8, "spec": 8, "pretti": 8, "print": 8, "space": [9, 10, 11, 12, 13, 21, 24, 50, 51, 52, 53, 54, 88, 89, 90, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 112, 113, 114], "base": [9, 17, 19, 20], "class": [9, 17, 19, 20], "fundament": [9, 11], "composit": [9, 10], "util": [9, 12, 13, 14], "dict": 10, "tupl": 10, "sequenc": 10, "graph": 10, "box": [11, 38], "discret": [11, 109], "multibinari": 11, "multidiscret": 11, "text": [11, 110], "share": 13, "memori": 13, "visual": [14, 139], "save": [14, 136], "video": [14, 84, 109], "old": 14, "api": [14, 22, 115, 119, 124], "compat": [14, 22, 127], "seed": [14, 23], "check": 14, "async": 15, "sync": 15, "avail": [17, 19, 20], "misc": [18, 124], "basic": [21, 131, 135, 137], "usag": 21, "initi": [21, 130, 132], "interact": 21, "explain": 21, "code": [21, 23, 133], "more": 21, "inform": [21, 111, 112, 113, 114], "gym": [22, 109, 130], "load": [22, 136], "openai": [22, 109], "v0": [22, 116, 117, 118, 119, 120, 121, 122, 123, 124, 126, 127, 128, 129, 130], "22": [22, 119], "v21": 23, "v26": 23, "migrat": 23, "guid": 23, "exampl": 23, "random": [23, 136], "number": 23, "gener": 23, "reset": [23, 89, 132], "timelimit": 23, "remov": 23, "autorom": 24, "instal": 24, "rom": 24, "stochast": 24, "argument": [24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 89, 90, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 112, 113, 114], "version": [24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 89, 90, 92, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 111, 112, 113, 114], "histori": [24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 89, 90, 92, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 112, 113, 114], "name": [24, 64], "scheme": 24, "flavor": 24, "refer": [24, 89, 92, 111, 112, 114, 115, 136, 141], "adventur": 25, "descript": [25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 89, 90, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 112, 113, 114], "air": 26, "raid": 26, "alien": 27, "amidar": 28, "assault": 29, "asterix": 30, "asteroid": 31, "atlanti": 32, "bank": 33, "heist": 33, "battl": 34, "zone": 34, "beam": 35, "rider": 35, "berzerk": 36, "bowl": 37, "breakout": 39, "carniv": 40, "centiped": 41, "chopper": 42, "command": 42, "complet": 43, "list": 43, "crazi": 44, "climber": 44, "defend": 45, "demon": 46, "attack": 46, "doubl": [47, 103], "dunk": 47, "elev": 48, "enduro": 49, "fishingderbi": 50, "freewai": 51, "frostbit": 52, "gopher": 53, "gravitar": 54, "hero": 55, "icehockei": 56, "jamesbond": 57, "journeyescap": 58, "kangaroo": 59, "krull": 60, "kung": 61, "fu": 61, "master": 61, "montezuma": 62, "reveng": 62, "m": 63, "pacman": 63, "thi": 64, "game": [64, 109], "phoenix": 65, "pitfal": 66, "pong": 67, "pooyan": 68, "privateey": 69, "qbert": 70, "riverraid": 71, "road": 72, "runner": 72, "robot": [73, 109], "tank": 73, "seaquest": 74, "ski": 75, "solari": 76, "spaceinvad": 77, "stargunn": 78, "tenni": 79, "timepilot": 80, "tutankham": 81, "up": 82, "n": 82, "down": 82, "ventur": 83, "pinbal": 84, "wizard": 85, "wor": 85, "zaxxon": 86, "box2d": 87, "biped": 88, "walker": 88, "start": [88, 89, 90, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 112, 113, 114], "state": [88, 89, 90, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 112, 113, 114, 132], "episod": [88, 89, 90, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 112, 113, 114], "termin": [88, 89, 90, 133], "credit": [88, 89, 90], "car": [89, 94, 95], "race": [89, 109], "lunar": 90, "lander": 90, "classic": [91, 109], "control": [91, 109], "acrobot": 92, "end": [92, 93, 94, 95, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 112, 113, 114], "cart": 93, "pole": 93, "mountain": [94, 95], "transit": [94, 95], "dynam": [94, 95, 109], "continu": 95, "pendulum": [96, 103, 104], "truncat": [96, 133], "mujoco": [97, 141], "ant": 98, "half": 99, "cheetah": 99, "hopper": 100, "humanoid": [101, 102], "standup": 102, "invert": [103, 104], "pusher": 105, "reacher": 106, "swimmer": 107, "note": [107, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 126, 127, 128, 129, 130], "walker2d": 108, "third": 109, "parti": 109, "stabl": 109, "retro": 109, "maintain": 109, "flappi": 109, "bird": 109, "A": 109, "derk": 109, "gpu": 109, "acceler": 109, "moba": 109, "slimevolleygym": 109, "simpl": 109, "singl": 109, "multi": 109, "agent": [109, 136, 137, 138, 139, 140, 141], "reinforc": [109, 115, 141], "learn": [109, 115, 133, 139, 141], "uniti": 109, "ml": 109, "engin": 109, "pge": 109, "parallel": 109, "jimini": 109, "train": [109, 136, 137, 138, 139, 140, 141], "pybullet": 109, "drone": 109, "quadcopt": 109, "marsexplor": 109, "mar": 109, "panda": 109, "us": [109, 132, 136, 141], "physic": 109, "robo": 109, "real": 109, "world": 109, "simul": 109, "offworld": 109, "safe": 109, "softrobot": 109, "soft": 109, "igibson": 109, "dexteroushand": 109, "dual": 109, "dexter": 109, "hand": 109, "manipul": 109, "task": 109, "omniisaacgymenv": 109, "autonom": 109, "drive": 109, "sumo": 109, "rl": 109, "duckietown": 109, "electr": 109, "motor": 109, "highwai": 109, "commonroad": 109, "tmrl": 109, "trackmania": 109, "2020": 109, "through": 109, "racing_dream": 109, "l2r": 109, "multimod": 109, "where": 109, "how": 109, "racecar_gym": 109, "compilergym": 109, "optimis": 109, "compil": 109, "carl": 109, "context": 109, "adapt": 109, "matrix": 109, "mdp": 109, "easili": 109, "creat": [109, 132], "mo": 109, "object": 109, "cellular": 109, "automata": 109, "sokoban": 109, "2d": 109, "transport": 109, "puzzl": 109, "dacbench": 109, "benchmark": 109, "librari": 109, "algorithm": 109, "configur": 109, "nlpgym": 109, "toolkit": 109, "develop": 109, "solv": [109, 139], "nlp": 109, "satur": 109, "prove": 109, "theorem": 109, "shinrl": 109, "evalu": 109, "gymnax": 109, "hardwar": 109, "anytrad": 109, "financi": 109, "trade": 109, "forex": 109, "stock": 109, "mtsim": 109, "metatrad": 109, "5": 109, "platform": 109, "openmodelica": 109, "microgrid": 109, "power": 109, "electron": 109, "convert": 109, "mobil": 109, "coordin": 109, "wireless": 109, "network": [109, 141], "gymfc": 109, "flight": 109, "tune": 109, "framework": 109, "toi": 110, "blackjack": [111, 139], "cliff": 112, "walk": 112, "frozen": 113, "lake": 113, "taxi": 114, "i": 115, "standard": 115, "divers": 115, "collect": 115, "19": 116, "0": [116, 117, 118, 120, 122, 124, 125, 127, 130], "releas": [116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 126, 127, 128, 129, 130], "featur": [116, 117], "bug": [116, 117, 123, 124, 125, 126, 128, 129], "fix": [116, 117, 123, 124, 125, 126, 128, 129], "20": 117, "major": [117, 122, 127], "chang": [117, 119, 120, 122, 124, 127], "break": [117, 120, 127], "upgrad": 117, "21": 118, "23": [120, 121], "1": [121, 123, 125, 128, 130], "24": [122, 123], "minor": [122, 127], "25": [124, 125, 126], "typo": 125, "2": [126, 129, 130], "updat": 126, "26": [127, 128, 129, 130], "backward": 127, "spell": 128, "27": 130, "3": 130, "your": 132, "own": 132, "subclass": 132, "declar": 132, "construct": 132, "from": [132, 134], "close": 132, "packag": 132, "instanc": 132, "handl": 133, "time": 133, "limit": 133, "import": [133, 139], "solut": 133, "inherit": 134, "observationwrapp": 134, "actionwrapp": 134, "rewardwrapp": 134, "a2c": 136, "domain": 136, "introduct": 136, "advantag": 136, "actor": 136, "critic": 136, "setup": [136, 139], "plot": [136, 141], "perform": 136, "analysi": 136, "synchron": 136, "asynchron": 136, "weight": 136, "showcas": 136, "try": 136, "plai": 136, "yourself": 136, "q": 139, "execut": 139, "visualis": 139, "polici": [139, 141], "think": 139, "you": 139, "can": 139, "do": 139, "better": 139, "curv": 141}, "envversion": {"sphinx.domains.c": 2, "sphinx.domains.changeset": 1, "sphinx.domains.citation": 1, "sphinx.domains.cpp": 8, "sphinx.domains.index": 1, "sphinx.domains.javascript": 2, "sphinx.domains.math": 2, "sphinx.domains.python": 3, "sphinx.domains.rst": 2, "sphinx.domains.std": 2, "sphinx": 57}, "alltitles": {"404 - Page Not Found": [[0, "page-not-found"]], "The requested page could not be found.": [[0, "the-requested-page-could-not-be-found"]], "Gymnasium-docs": [[1, "gymnasium-docs"]], "Instructions for modifying environment pages": [[1, "instructions-for-modifying-environment-pages"]], "Editing an environment page": [[1, "editing-an-environment-page"]], "Adding a new environment": [[1, "adding-a-new-environment"]], "Atari env": [[1, "atari-env"]], "Non-Atari env": [[1, "non-atari-env"]], "Other steps": [[1, "other-steps"]], "Build the Documentation": [[1, "build-the-documentation"]], "Writing Tutorials": [[1, "writing-tutorials"]], "Env": [[2, "env"]], "gymnasium.Env": [[2, "gymnasium-env"]], "Methods": [[2, "methods"], [9, "methods"], [15, "methods"], [16, "methods"]], "Attributes": [[2, "attributes"], [9, "attributes"], [15, "attributes"], [16, "attributes"]], "Additional Methods": [[2, "additional-methods"]], "Implementing environments": [[2, "implementing-environments"]], "Experimental": [[3, "experimental"]], "Functional Environments": [[3, "functional-environments"]], "Wrappers": [[3, "wrappers"], [7, "wrappers"], [16, "wrappers"]], "Observation Wrappers": [[3, "observation-wrappers"], [7, "observation-wrappers"], [19, "observation-wrappers"]], "Action Wrappers": [[3, "action-wrappers"], [7, "action-wrappers"], [17, "action-wrappers"]], "Reward Wrappers": [[3, "reward-wrappers"], [7, "reward-wrappers"], [20, "reward-wrappers"]], "Common Wrappers": [[3, "common-wrappers"]], "Rendering Wrappers": [[3, "rendering-wrappers"], [7, "rendering-wrappers"]], "Environment data conversion": [[3, "environment-data-conversion"], [7, "environment-data-conversion"]], "Vector Environment": [[3, "vector-environment"]], "Wrappers for Vector Environments": [[3, "wrappers-for-vector-environments"]], "Functional Environment": [[4, "functional-environment"]], "gymnasium.experimental.FuncEnv": [[4, "gymnasium-experimental-funcenv"]], "gymnasium.experimental.func2env.FunctionalJaxCompatibilityEnv": [[4, "gymnasium-experimental-func2env-functionaljaxcompatibilityenv"]], "Vectorizing Environment": [[5, "vectorizing-environment"]], "gymnasium.experimental.VectorEnv": [[5, "gymnasium-experimental-vectorenv"]], "gymnasium.experimental.vector.AsyncVectorEnv": [[5, "gymnasium-experimental-vector-asyncvectorenv"]], "gymnasium.experimental.vector.SyncVectorEnv": [[5, "gymnasium-experimental-vector-syncvectorenv"]], "Custom Vector environments": [[5, "custom-vector-environments"]], "EnvPool": [[5, "envpool"]], "Vector Environment Wrappers": [[6, "vector-environment-wrappers"]], "Vector Lambda Observation Wrappers": [[6, "vector-lambda-observation-wrappers"]], "Vector Lambda Action Wrappers": [[6, "vector-lambda-action-wrappers"]], "Vector Lambda Reward Wrappers": [[6, "vector-lambda-reward-wrappers"]], "Vector Common Wrappers": [[6, "vector-common-wrappers"]], "Vector Only Wrappers": [[6, "vector-only-wrappers"]], "Other Wrappers": [[7, "other-wrappers"]], "Registry": [[8, "registry"]], "Make": [[8, "make"]], "Register": [[8, "register"]], "All registered environments": [[8, "all-registered-environments"]], "Spec": [[8, "spec"]], "Pretty print registry": [[8, "pretty-print-registry"]], "Spaces": [[9, "spaces"]], "The Base Class": [[9, "the-base-class"]], "Fundamental Spaces": [[9, "fundamental-spaces"], [11, "fundamental-spaces"]], "Composite Spaces": [[9, "composite-spaces"], [10, "composite-spaces"]], "Utils": [[9, "utils"], [14, "utils"]], "Vector Utils": [[9, "vector-utils"]], "Dict": [[10, "dict"]], "Tuple": [[10, "tuple"]], "Sequence": [[10, "sequence"]], "Graph": [[10, "graph"]], "Box": [[11, "box"]], "Discrete": [[11, "discrete"]], "MultiBinary": [[11, "multibinary"]], "MultiDiscrete": [[11, "multidiscrete"]], "Text": [[11, "text"]], "Spaces Utils": [[12, "spaces-utils"]], "Spaces Vector Utils": [[13, "spaces-vector-utils"]], "Shared Memory Utils": [[13, "shared-memory-utils"]], "Visualization": [[14, "visualization"]], "Save Rendering Videos": [[14, "save-rendering-videos"]], "Old to New Step API Compatibility": [[14, "old-to-new-step-api-compatibility"]], "Seeding": [[14, "seeding"]], "Environment Checking": [[14, "environment-checking"]], "Vector": [[15, "vector"]], "Gymnasium.vector.VectorEnv": [[15, "gymnasium-vector-vectorenv"]], "Making Vector Environments": [[15, "making-vector-environments"]], "Async Vector Env": [[15, "async-vector-env"]], "Sync Vector Env": [[15, "sync-vector-env"]], "gymnasium.Wrapper": [[16, "gymnasium-wrapper"]], "Gymnasium Wrappers": [[16, "gymnasium-wrappers"]], "Base Class": [[17, "base-class"], [19, "base-class"], [20, "base-class"]], "Available Action Wrappers": [[17, "available-action-wrappers"]], "Misc Wrappers": [[18, "misc-wrappers"]], "Available Observation Wrappers": [[19, "available-observation-wrappers"]], "Available Reward Wrappers": [[20, "available-reward-wrappers"]], "Basic Usage": [[21, "basic-usage"]], "Initializing Environments": [[21, "initializing-environments"]], "Interacting with the Environment": [[21, "interacting-with-the-environment"]], "Explaining the code": [[21, "explaining-the-code"]], "Action and observation spaces": [[21, "action-and-observation-spaces"]], "Modifying the environment": [[21, "modifying-the-environment"]], "More information": [[21, "more-information"]], "Compatibility with Gym": [[22, "compatibility-with-gym"]], "Loading OpenAI Gym environments": [[22, "loading-openai-gym-environments"]], "Gym v0.22 Environment Compatibility": [[22, "gym-v0-22-environment-compatibility"]], "Step API Compatibility": [[22, "step-api-compatibility"]], "v21 to v26 Migration Guide": [[23, "v21-to-v26-migration-guide"]], "Example code for v21": [[23, "example-code-for-v21"]], "Example code for v26": [[23, "example-code-for-v26"]], "Seed and random number generator": [[23, "seed-and-random-number-generator"]], "Environment Reset": [[23, "environment-reset"]], "Environment Step": [[23, "environment-step"]], "TimeLimit Wrapper": [[23, "timelimit-wrapper"]], "Environment Render": [[23, "environment-render"]], "Removed code": [[23, "removed-code"]], "Atari": [[24, "atari"]], "AutoROM (installing the ROMs)": [[24, "autorom-installing-the-roms"]], "Action Space": [[24, "action-space"], [50, "action-space"], [51, "action-space"], [52, "action-space"], [53, "action-space"], [54, "action-space"], [88, "action-space"], [89, "action-space"], [90, "action-space"], [92, "action-space"], [93, "action-space"], [94, "action-space"], [95, "action-space"], [96, "action-space"], [98, "action-space"], [99, "action-space"], [100, "action-space"], [101, "action-space"], [102, "action-space"], [103, "action-space"], [104, "action-space"], [105, "action-space"], [106, "action-space"], [107, "action-space"], [108, "action-space"], [111, "action-space"], [112, "action-space"], [113, "action-space"], [114, "action-space"]], "Observation Space": [[24, "observation-space"], [88, "observation-space"], [89, "observation-space"], [90, "observation-space"], [92, "observation-space"], [93, "observation-space"], [94, "observation-space"], [95, "observation-space"], [96, "observation-space"], [98, "observation-space"], [99, "observation-space"], [100, "observation-space"], [101, "observation-space"], [102, "observation-space"], [103, "observation-space"], [104, "observation-space"], [105, "observation-space"], [106, "observation-space"], [107, "observation-space"], [108, "observation-space"], [111, "observation-space"], [112, "observation-space"], [113, "observation-space"], [114, "observation-space"]], "Rewards": [[24, "rewards"], [27, "rewards"], [28, "rewards"], [30, "rewards"], [31, "rewards"], [32, "rewards"], [33, "rewards"], [34, "rewards"], [35, "rewards"], [36, "rewards"], [37, "rewards"], [38, "rewards"], [39, "rewards"], [40, "rewards"], [41, "rewards"], [42, "rewards"], [44, "rewards"], [45, "rewards"], [46, "rewards"], [47, "rewards"], [48, "rewards"], [49, "rewards"], [50, "rewards"], [51, "rewards"], [52, "rewards"], [53, "rewards"], [54, "rewards"], [55, "rewards"], [56, "rewards"], [57, "rewards"], [58, "rewards"], [59, "rewards"], [60, "rewards"], [66, "rewards"], [67, "rewards"], [68, "rewards"], [69, "rewards"], [70, "rewards"], [71, "rewards"], [72, "rewards"], [73, "rewards"], [74, "rewards"], [75, "rewards"], [76, "rewards"], [77, "rewards"], [78, "rewards"], [79, "rewards"], [80, "rewards"], [88, "rewards"], [89, "rewards"], [90, "rewards"], [92, "rewards"], [93, "rewards"], [96, "rewards"], [98, "rewards"], [99, "rewards"], [100, "rewards"], [101, "rewards"], [102, "rewards"], [103, "rewards"], [104, "rewards"], [105, "rewards"], [106, "rewards"], [107, "rewards"], [108, "rewards"], [111, "rewards"], [113, "rewards"], [114, "rewards"]], "Stochasticity": [[24, "stochasticity"]], "Common Arguments": [[24, "common-arguments"]], "Version History and Naming Schemes": [[24, "version-history-and-naming-schemes"]], "Flavors": [[24, "flavors"]], "References": [[24, "references"], [89, "references"], [92, "references"], [111, "references"], [112, "references"], [114, "references"], [136, "references"], [141, "references"]], "Adventure": [[25, "adventure"]], "Description": [[25, "description"], [26, "description"], [27, "description"], [28, "description"], [29, "description"], [30, "description"], [31, "description"], [32, "description"], [33, "description"], [34, "description"], [35, "description"], [36, "description"], [37, "description"], [38, "description"], [39, "description"], [40, "description"], [41, "description"], [42, "description"], [44, "description"], [45, "description"], [46, "description"], [47, "description"], [48, "description"], [49, "description"], [50, "description"], [51, "description"], [52, "description"], [53, "description"], [54, "description"], [55, "description"], [56, "description"], [57, "description"], [58, "description"], [59, "description"], [60, "description"], [61, "description"], [62, "description"], [63, "description"], [64, "description"], [65, "description"], [66, "description"], [67, "description"], [68, "description"], [69, "description"], [70, "description"], [71, "description"], [72, "description"], [73, "description"], [74, "description"], [75, "description"], [76, "description"], [77, "description"], [78, "description"], [79, "description"], [80, "description"], [81, "description"], [82, "description"], [83, "description"], [84, "description"], [85, "description"], [86, "description"], [88, "description"], [89, "description"], [90, "description"], [92, "description"], [93, "description"], [94, "description"], [95, "description"], [96, "description"], [98, "description"], [99, "description"], [100, "description"], [101, "description"], [102, "description"], [103, "description"], [104, "description"], [105, "description"], [106, "description"], [107, "description"], [108, "description"], [111, "description"], [112, "description"], [113, "description"], [114, "description"]], "Actions": [[25, "actions"], [26, "actions"], [27, "actions"], [28, "actions"], [29, "actions"], [30, "actions"], [31, "actions"], [32, "actions"], [33, "actions"], [34, "actions"], [35, "actions"], [36, "actions"], [37, "actions"], [38, "actions"], [39, "actions"], [40, "actions"], [41, "actions"], [42, "actions"], [44, "actions"], [45, "actions"], [46, "actions"], [47, "actions"], [48, "actions"], [49, "actions"], [55, "actions"], [56, "actions"], [57, "actions"], [58, "actions"], [59, "actions"], [60, "actions"], [61, "actions"], [62, "actions"], [63, "actions"], [64, "actions"], [65, "actions"], [66, "actions"], [67, "actions"], [68, "actions"], [69, "actions"], [70, "actions"], [71, "actions"], [72, "actions"], [73, "actions"], [74, "actions"], [75, "actions"], [76, "actions"], [77, "actions"], [78, "actions"], [79, "actions"], [80, "actions"], [81, "actions"], [82, "actions"], [83, "actions"], [84, "actions"], [85, "actions"], [86, "actions"]], "Observations": [[25, "observations"], [26, "observations"], [27, "observations"], [28, "observations"], [29, "observations"], [30, "observations"], [31, "observations"], [32, "observations"], [33, "observations"], [34, "observations"], [35, "observations"], [36, "observations"], [37, "observations"], [38, "observations"], [39, "observations"], [40, "observations"], [41, "observations"], [42, "observations"], [44, "observations"], [45, "observations"], [46, "observations"], [47, "observations"], [48, "observations"], [49, "observations"], [50, "observations"], [51, "observations"], [52, "observations"], [53, "observations"], [54, "observations"], [55, "observations"], [56, "observations"], [57, "observations"], [58, "observations"], [59, "observations"], [60, "observations"], [61, "observations"], [62, "observations"], [63, "observations"], [64, "observations"], [65, "observations"], [66, "observations"], [67, "observations"], [68, "observations"], [69, "observations"], [70, "observations"], [71, "observations"], [72, "observations"], [73, "observations"], [74, "observations"], [75, "observations"], [76, "observations"], [77, "observations"], [78, "observations"], [79, "observations"], [80, "observations"], [81, "observations"], [82, "observations"], [83, "observations"], [84, "observations"], [85, "observations"], [86, "observations"]], "Arguments": [[25, "arguments"], [26, "arguments"], [27, "arguments"], [28, "arguments"], [29, "arguments"], [30, "arguments"], [31, "arguments"], [32, "arguments"], [33, "arguments"], [34, "arguments"], [35, "arguments"], [36, "arguments"], [37, "arguments"], [38, "arguments"], [39, "arguments"], [40, "arguments"], [41, "arguments"], [42, "arguments"], [44, "arguments"], [45, "arguments"], [46, "arguments"], [47, "arguments"], [48, "arguments"], [49, "arguments"], [50, "arguments"], [51, "arguments"], [52, "arguments"], [53, "arguments"], [54, "arguments"], [55, "arguments"], [56, "arguments"], [57, "arguments"], [58, "arguments"], [59, "arguments"], [60, "arguments"], [61, "arguments"], [62, "arguments"], [63, "arguments"], [64, "arguments"], [65, "arguments"], [66, "arguments"], [67, "arguments"], [68, "arguments"], [69, "arguments"], [70, "arguments"], [71, "arguments"], [72, "arguments"], [73, "arguments"], [74, "arguments"], [75, "arguments"], [76, "arguments"], [77, "arguments"], [78, "arguments"], [79, "arguments"], [80, "arguments"], [81, "arguments"], [82, "arguments"], [83, "arguments"], [84, "arguments"], [85, "arguments"], [86, "arguments"], [88, "arguments"], [89, "arguments"], [90, "arguments"], [92, "arguments"], [93, "arguments"], [94, "arguments"], [95, "arguments"], [96, "arguments"], [98, "arguments"], [99, "arguments"], [100, "arguments"], [101, "arguments"], [102, "arguments"], [103, "arguments"], [104, "arguments"], [105, "arguments"], [106, "arguments"], [107, "arguments"], [108, "arguments"], [111, "arguments"], [112, "arguments"], [113, "arguments"], [114, "arguments"]], "Version History": [[25, "version-history"], [26, "version-history"], [27, "version-history"], [28, "version-history"], [29, "version-history"], [30, "version-history"], [31, "version-history"], [32, "version-history"], [33, "version-history"], [34, "version-history"], [35, "version-history"], [36, "version-history"], [37, "version-history"], [38, "version-history"], [39, "version-history"], [40, "version-history"], [41, "version-history"], [42, "version-history"], [44, "version-history"], [45, "version-history"], [46, "version-history"], [47, "version-history"], [48, "version-history"], [49, "version-history"], [50, "version-history"], [51, "version-history"], [52, "version-history"], [53, "version-history"], [54, "version-history"], [55, "version-history"], [56, "version-history"], [57, "version-history"], [58, "version-history"], [59, "version-history"], [60, "version-history"], [61, "version-history"], [62, "version-history"], [63, "version-history"], [64, "version-history"], [65, "version-history"], [66, "version-history"], [67, "version-history"], [68, "version-history"], [69, "version-history"], [70, "version-history"], [71, "version-history"], [72, "version-history"], [73, "version-history"], [74, "version-history"], [75, "version-history"], [76, "version-history"], [77, "version-history"], [78, "version-history"], [79, "version-history"], [80, "version-history"], [81, "version-history"], [82, "version-history"], [83, "version-history"], [84, "version-history"], [85, "version-history"], [86, "version-history"], [88, "version-history"], [89, "version-history"], [90, "version-history"], [92, "version-history"], [94, "version-history"], [95, "version-history"], [96, "version-history"], [98, "version-history"], [99, "version-history"], [100, "version-history"], [101, "version-history"], [102, "version-history"], [103, "version-history"], [104, "version-history"], [105, "version-history"], [106, "version-history"], [107, "version-history"], [108, "version-history"], [111, "version-history"], [112, "version-history"], [113, "version-history"], [114, "version-history"]], "Air Raid": [[26, "air-raid"]], "Alien": [[27, "alien"]], "Amidar": [[28, "amidar"]], "Assault": [[29, "assault"]], "Asterix": [[30, "asterix"]], "Asteroids": [[31, "asteroids"]], "Atlantis": [[32, "atlantis"]], "Bank Heist": [[33, "bank-heist"]], "Battle Zone": [[34, "battle-zone"]], "Beam Rider": [[35, "beam-rider"]], "Berzerk": [[36, "berzerk"]], "Bowling": [[37, "bowling"]], "Boxing": [[38, "boxing"]], "Breakout": [[39, "breakout"]], "Carnival": [[40, "carnival"]], "Centipede": [[41, "centipede"]], "Chopper Command": [[42, "chopper-command"]], "Complete List - Atari": [[43, "complete-list-atari"]], "Crazy Climber": [[44, "crazy-climber"]], "Defender": [[45, "defender"]], "Demon Attack": [[46, "demon-attack"]], "Double Dunk": [[47, "double-dunk"]], "Elevator Action": [[48, "elevator-action"]], "Enduro": [[49, "enduro"]], "FishingDerby": [[50, "fishingderby"]], "Freeway": [[51, "freeway"]], "Frostbite": [[52, "frostbite"]], "Gopher": [[53, "gopher"]], "Gravitar": [[54, "gravitar"]], "Hero": [[55, "hero"]], "IceHockey": [[56, "icehockey"]], "Jamesbond": [[57, "jamesbond"]], "JourneyEscape": [[58, "journeyescape"]], "Kangaroo": [[59, "kangaroo"]], "Krull": [[60, "krull"]], "Kung Fu Master": [[61, "kung-fu-master"]], "Montezuma Revenge": [[62, "montezuma-revenge"]], "Ms Pacman": [[63, "ms-pacman"]], "Name This Game": [[64, "name-this-game"]], "Phoenix": [[65, "phoenix"]], "Pitfall": [[66, "pitfall"]], "Pong": [[67, "pong"]], "Pooyan": [[68, "pooyan"]], "PrivateEye": [[69, "privateeye"]], "Qbert": [[70, "qbert"]], "Riverraid": [[71, "riverraid"]], "Road Runner": [[72, "road-runner"]], "Robot Tank": [[73, "robot-tank"]], "Seaquest": [[74, "seaquest"]], "Skiings": [[75, "skiings"]], "Solaris": [[76, "solaris"]], "SpaceInvaders": [[77, "spaceinvaders"]], "StarGunner": [[78, "stargunner"]], "Tennis": [[79, "tennis"]], "TimePilot": [[80, "timepilot"]], "Tutankham": [[81, "tutankham"]], "Up n\u2019 Down": [[82, "up-n-down"]], "Venture": [[83, "venture"]], "Video Pinball": [[84, "video-pinball"]], "Wizard of Wor": [[85, "wizard-of-wor"]], "Zaxxon": [[86, "zaxxon"]], "Box2D": [[87, "box2d"]], "Bipedal Walker": [[88, "bipedal-walker"]], "Starting State": [[88, "starting-state"], [89, "starting-state"], [90, "starting-state"], [92, "starting-state"], [93, "starting-state"], [94, "starting-state"], [95, "starting-state"], [96, "starting-state"], [98, "starting-state"], [99, "starting-state"], [100, "starting-state"], [101, "starting-state"], [102, "starting-state"], [103, "starting-state"], [104, "starting-state"], [105, "starting-state"], [106, "starting-state"], [107, "starting-state"], [108, "starting-state"], [111, "starting-state"], [112, "starting-state"], [113, "starting-state"], [114, "starting-state"]], "Episode Termination": [[88, "episode-termination"], [89, "episode-termination"], [90, "episode-termination"]], "Credits": [[88, "credits"], [89, "credits"], [90, "credits"]], "Car Racing": [[89, "car-racing"]], "Reset Arguments": [[89, "reset-arguments"]], "Lunar Lander": [[90, "lunar-lander"]], "Classic Control": [[91, "classic-control"]], "Acrobot": [[92, "acrobot"]], "Episode End": [[92, "episode-end"], [93, "episode-end"], [94, "episode-end"], [95, "episode-end"], [98, "episode-end"], [99, "episode-end"], [100, "episode-end"], [101, "episode-end"], [102, "episode-end"], [103, "episode-end"], [104, "episode-end"], [105, "episode-end"], [106, "episode-end"], [107, "episode-end"], [108, "episode-end"], [111, "episode-end"], [112, "episode-end"], [113, "episode-end"], [114, "episode-end"]], "Cart Pole": [[93, "cart-pole"]], "Mountain Car": [[94, "mountain-car"]], "Transition Dynamics:": [[94, "transition-dynamics"], [95, "transition-dynamics"]], "Reward:": [[94, "reward"]], "Mountain Car Continuous": [[95, "mountain-car-continuous"]], "Reward": [[95, "reward"], [112, "reward"]], "Pendulum": [[96, "pendulum"]], "Episode Truncation": [[96, "episode-truncation"]], "MuJoCo": [[97, "mujoco"]], "Ant": [[98, "ant"]], "Half Cheetah": [[99, "half-cheetah"]], "Hopper": [[100, "hopper"]], "Humanoid": [[101, "humanoid"]], "Humanoid Standup": [[102, "humanoid-standup"]], "Inverted Double Pendulum": [[103, "inverted-double-pendulum"]], "Inverted Pendulum": [[104, "inverted-pendulum"]], "Pusher": [[105, "pusher"]], "Reacher": [[106, "reacher"]], "Swimmer": [[107, "swimmer"]], "Notes": [[107, "notes"]], "Walker2D": [[108, "walker2d"]], "Third-party Environments": [[109, "third-party-environments"]], "Video Game environments": [[109, "video-game-environments"]], "stable-retro: Classic retro games, a maintained version of OpenAI Retro": [[109, "stable-retro-classic-retro-games-a-maintained-version-of-openai-retro"]], "flappy-bird-gym: A Flappy Bird environment for Gym": [[109, "flappy-bird-gym-a-flappy-bird-environment-for-gym"]], "gym-derk: GPU accelerated MOBA environment": [[109, "gym-derk-gpu-accelerated-moba-environment"]], "SlimeVolleyGym: A simple environment for single and multi-agent reinforcement learning": [[109, "slimevolleygym-a-simple-environment-for-single-and-multi-agent-reinforcement-learning"]], "Unity ML Agents: Environments for Unity game engine": [[109, "unity-ml-agents-environments-for-unity-game-engine"]], "PGE: Parallel Game Engine": [[109, "pge-parallel-game-engine"]], "Robotics environments": [[109, "robotics-environments"]], "gym-jiminy: Training Robots in Jiminy": [[109, "gym-jiminy-training-robots-in-jiminy"]], "gym-pybullet-drones: Environments for quadcopter control": [[109, "gym-pybullet-drones-environments-for-quadcopter-control"]], "MarsExplorer: Environments for controlling robot on Mars": [[109, "marsexplorer-environments-for-controlling-robot-on-mars"]], "panda-gym: Robotics environments using the PyBullet physics engine": [[109, "panda-gym-robotics-environments-using-the-pybullet-physics-engine"]], "robo-gym: Real-world and simulation robotics": [[109, "robo-gym-real-world-and-simulation-robotics"]], "Offworld-gym": [[109, "offworld-gym"]], "safe-control-gym": [[109, "safe-control-gym"]], "gym-softrobot: Soft-robotics environments": [[109, "gym-softrobot-soft-robotics-environments"]], "iGibson": [[109, "igibson"]], "DexterousHands: dual dexterous hand manipulation tasks": [[109, "dexteroushands-dual-dexterous-hand-manipulation-tasks"]], "OmniIsaacGymEnvs": [[109, "omniisaacgymenvs"]], "Autonomous Driving environments": [[109, "autonomous-driving-environments"]], "sumo-rl": [[109, "sumo-rl"]], "gym-duckietown": [[109, "gym-duckietown"]], "gym-electric-motor": [[109, "gym-electric-motor"]], "highway-env": [[109, "highway-env"]], "CommonRoad-RL": [[109, "commonroad-rl"]], "tmrl: TrackMania 2020 through RL": [[109, "tmrl-trackmania-2020-through-rl"]], "racing_dreamer": [[109, "racing-dreamer"]], "l2r: Multimodal control environment where agents learn how to race": [[109, "l2r-multimodal-control-environment-where-agents-learn-how-to-race"]], "racecar_gym": [[109, "racecar-gym"]], "Other environments": [[109, "other-environments"]], "CompilerGym: Optimise compiler tasks": [[109, "compilergym-optimise-compiler-tasks"]], "CARL: context adaptive RL": [[109, "carl-context-adaptive-rl"]], "matrix-mdp: Easily create discrete MDPs": [[109, "matrix-mdp-easily-create-discrete-mdps"]], "mo-gym: Multi-objective Reinforcement Learning environments": [[109, "mo-gym-multi-objective-reinforcement-learning-environments"]], "gym-cellular-automata: Cellular Automata environments": [[109, "gym-cellular-automata-cellular-automata-environments"]], "gym-sokoban: 2D Transportation Puzzles": [[109, "gym-sokoban-2d-transportation-puzzles"]], "DACBench: Benchmark Library for Dynamic Algorithm configuration": [[109, "dacbench-benchmark-library-for-dynamic-algorithm-configuration"]], "NLPGym: A toolkit to develop RL agents to solve NLP tasks": [[109, "nlpgym-a-toolkit-to-develop-rl-agents-to-solve-nlp-tasks"]], "gym-saturation: Environments used to prove theorems": [[109, "gym-saturation-environments-used-to-prove-theorems"]], "ShinRL: Environments for evaluating RL algorithms": [[109, "shinrl-environments-for-evaluating-rl-algorithms"]], "gymnax: Hardware Accelerated RL Environments": [[109, "gymnax-hardware-accelerated-rl-environments"]], "gym-anytrading: Financial trading environments for FOREX and STOCKS": [[109, "gym-anytrading-financial-trading-environments-for-forex-and-stocks"]], "gym-mtsim: Financial trading for MetaTrader 5 platform": [[109, "gym-mtsim-financial-trading-for-metatrader-5-platform"]], "openmodelica-microgrid-gym: Environments for controlling power electronic converters in microgrids": [[109, "openmodelica-microgrid-gym-environments-for-controlling-power-electronic-converters-in-microgrids"]], "mobile-env: Environments for coordination of wireless mobile networks": [[109, "mobile-env-environments-for-coordination-of-wireless-mobile-networks"]], "GymFC: A flight control tuning and training framework": [[109, "gymfc-a-flight-control-tuning-and-training-framework"]], "Toy Text": [[110, "toy-text"]], "Blackjack": [[111, "blackjack"]], "Information": [[111, "information"], [112, "information"], [113, "information"], [114, "information"]], "Cliff Walking": [[112, "cliff-walking"]], "Frozen Lake": [[113, "frozen-lake"]], "Taxi": [[114, "taxi"]], "Gymnasium is a standard API for reinforcement learning, and a diverse collection of reference environments": [[115, "gymnasium-is-a-standard-api-for-reinforcement-learning-and-a-diverse-collection-of-reference-environments"]], "v0.19.0 Release Notes": [[116, "v0-19-0-release-notes"]], "New features": [[116, "new-features"]], "Bug fixes": [[116, "bug-fixes"], [124, "bug-fixes"]], "Other": [[116, "other"]], "v0.20.0 Release Notes": [[117, "v0-20-0-release-notes"]], "Major Change": [[117, "major-change"]], "Breaking changes and new features:": [[117, "breaking-changes-and-new-features"]], "Bug fixes and upgrades": [[117, "bug-fixes-and-upgrades"]], "v0.21.0 Release Notes": [[118, "v0-21-0-release-notes"]], "v0.22 Release Notes": [[119, "v0-22-release-notes"]], "API changes": [[119, "api-changes"]], "Environment changes": [[119, "environment-changes"]], "Other changes": [[119, "other-changes"]], "v0.23.0 Release Notes": [[120, "v0-23-0-release-notes"]], "Breaking changes": [[120, "breaking-changes"]], "v0.23.1 Release Notes": [[121, "v0-23-1-release-notes"]], "v0.24.0 Release Notes": [[122, "v0-24-0-release-notes"]], "Major changes": [[122, "major-changes"], [127, "major-changes"]], "Minor changes": [[122, "minor-changes"], [127, "minor-changes"]], "v0.24.1 Release Notes": [[123, "v0-24-1-release-notes"]], "Bugs fixed": [[123, "bugs-fixed"]], "v0.25.0 Release notes": [[124, "v0-25-0-release-notes"]], "API Changes": [[124, "api-changes"]], "Misc": [[124, "misc"]], "0.25.1 Release Notes": [[125, "release-notes"]], "Bug fix": [[125, "bug-fix"]], "Typos": [[125, "typos"]], "v0.25.2 Release Notes": [[126, "v0-25-2-release-notes"]], "Bug Fixes": [[126, "bug-fixes"], [128, "bug-fixes"]], "Updates": [[126, "updates"]], "v0.26.0 Release Notes": [[127, "v0-26-0-release-notes"]], "Breaking backward compatibility": [[127, "breaking-backward-compatibility"]], "v0.26.1 Release Notes": [[128, "v0-26-1-release-notes"]], "Spelling": [[128, "spelling"]], "v0.26.2 Release Notes": [[129, "v0-26-2-release-notes"]], "Bugs Fixes": [[129, "bugs-fixes"]], "Release Notes": [[130, "release-notes"]], "v0.27.1": [[130, "release-v0-27-1"]], "v0.27.0": [[130, "release-v0-27-0"]], "v0.26.3": [[130, "release-v0-26-3"]], "v0.26.2: 0.26.2 ": [[130, "release-v0-26-2"]], "v0.26.1: 0.26.1": [[130, "release-v0-26-1"]], "v0.26.0: Initial Release": [[130, "release-v0-26-0"]], "Gym Release Notes": [[130, "gym-release-notes"]], "Gymnasium Basics": [[131, "gymnasium-basics"], [135, "gymnasium-basics"], [137, "gymnasium-basics"]], "Make your own custom environment": [[132, "make-your-own-custom-environment"]], "Subclassing gymnasium.Env": [[132, "subclassing-gymnasium-env"]], "Declaration and Initialization": [[132, "declaration-and-initialization"]], "Constructing Observations From Environment States": [[132, "constructing-observations-from-environment-states"]], "Reset": [[132, "reset"]], "Step": [[132, "step"]], "Rendering": [[132, "rendering"]], "Close": [[132, "close"]], "Registering Envs": [[132, "registering-envs"]], "Creating a Package": [[132, "creating-a-package"]], "Creating Environment Instances": [[132, "creating-environment-instances"]], "Using Wrappers": [[132, "using-wrappers"]], "Handling Time Limits": [[133, "handling-time-limits"]], "Termination": [[133, "termination"]], "Truncation": [[133, "truncation"]], "Importance in learning code": [[133, "importance-in-learning-code"]], "Solution": [[133, "solution"]], "Implementing Custom Wrappers": [[134, "implementing-custom-wrappers"]], "Inheriting from gymnasium.ObservationWrapper": [[134, "inheriting-from-gymnasium-observationwrapper"]], "Inheriting from gymnasium.ActionWrapper": [[134, "inheriting-from-gymnasium-actionwrapper"]], "Inheriting from gymnasium.RewardWrapper": [[134, "inheriting-from-gymnasium-rewardwrapper"]], "Inheriting from gymnasium.Wrapper": [[134, "inheriting-from-gymnasium-wrapper"]], "Training A2C with Vector Envs and Domain Randomization": [[136, "training-a2c-with-vector-envs-and-domain-randomization"]], "Introduction": [[136, "introduction"]], "Advantage Actor-Critic (A2C)": [[136, "advantage-actor-critic-a2c"]], "Using Vectorized Environments": [[136, "using-vectorized-environments"]], "Domain Randomization": [[136, "domain-randomization"]], "Setup": [[136, "setup"]], "Training the A2C Agent": [[136, "training-the-a2c-agent"]], "Plotting": [[136, "plotting"]], "Performance Analysis of Synchronous and Asynchronous Vectorized Environments": [[136, "performance-analysis-of-synchronous-and-asynchronous-vectorized-environments"]], "Saving/ Loading Weights": [[136, "saving-loading-weights"]], "Showcase the Agent": [[136, "showcase-the-agent"]], "Try playing the environment yourself": [[136, "try-playing-the-environment-yourself"]], "Tutorials": [[137, "tutorials"]], "Training Agents": [[137, "training-agents"], [138, "training-agents"], [140, "training-agents"]], "Solving Blackjack with Q-Learning": [[139, "solving-blackjack-with-q-learning"]], "Imports and Environment Setup": [[139, "imports-and-environment-setup"]], "Observing the environment": [[139, "observing-the-environment"]], "Executing an action": [[139, "executing-an-action"]], "Building an agent": [[139, "building-an-agent"], [141, "building-an-agent"]], "Visualizing the training": [[139, "visualizing-the-training"]], "Visualising the policy": [[139, "visualising-the-policy"]], "Think you can do better?": [[139, "think-you-can-do-better"]], "Training using REINFORCE for Mujoco": [[141, "training-using-reinforce-for-mujoco"]], "Policy Network": [[141, "policy-network"]], "Plot learning curve": [[141, "plot-learning-curve"]]}, "indexentries": {"env (class in gymnasium)": [[2, "gymnasium.Env"]], "action_space (gymnasium.env attribute)": [[2, "gymnasium.Env.action_space"]], "close() (in module gymnasium.env)": [[2, "gymnasium.Env.close"]], "metadata (gymnasium.env attribute)": [[2, "gymnasium.Env.metadata"]], "np_random (gymnasium.env property)": [[2, "gymnasium.Env.np_random"]], "observation_space (gymnasium.env attribute)": [[2, "gymnasium.Env.observation_space"]], "render() (in module gymnasium.env)": [[2, "gymnasium.Env.render"]], "render_mode (gymnasium.env attribute)": [[2, "gymnasium.Env.render_mode"]], "reset() (in module gymnasium.env)": [[2, "gymnasium.Env.reset"]], "reward_range (gymnasium.env attribute)": [[2, "gymnasium.Env.reward_range"]], "spec (gymnasium.env attribute)": [[2, "gymnasium.Env.spec"]], "step() (in module gymnasium.env)": [[2, "gymnasium.Env.step"]], "unwrapped (gymnasium.env property)": [[2, "gymnasium.Env.unwrapped"]], "funcenv (class in gymnasium.experimental)": [[4, "gymnasium.experimental.FuncEnv"]], "initial() (in module gymnasium.experimental.funcenv)": [[4, "gymnasium.experimental.FuncEnv.initial"]], "observation() (in module gymnasium.experimental.funcenv)": [[4, "gymnasium.experimental.FuncEnv.observation"]], "render_close() (in module gymnasium.experimental.funcenv)": [[4, "gymnasium.experimental.FuncEnv.render_close"]], "render_image() (in module gymnasium.experimental.funcenv)": [[4, "gymnasium.experimental.FuncEnv.render_image"]], "render_init() (in module gymnasium.experimental.funcenv)": [[4, "gymnasium.experimental.FuncEnv.render_init"]], "reward() (in module gymnasium.experimental.funcenv)": [[4, "gymnasium.experimental.FuncEnv.reward"]], "state_info() (in module gymnasium.experimental.funcenv)": [[4, "gymnasium.experimental.FuncEnv.state_info"]], "step_info() (in module gymnasium.experimental.funcenv)": [[4, "gymnasium.experimental.FuncEnv.step_info"]], "terminal() (in module gymnasium.experimental.funcenv)": [[4, "gymnasium.experimental.FuncEnv.terminal"]], "transform() (in module gymnasium.experimental.funcenv)": [[4, "gymnasium.experimental.FuncEnv.transform"]], "transition() (in module gymnasium.experimental.funcenv)": [[4, "gymnasium.experimental.FuncEnv.transition"]], "ataripreprocessingv0 (class in gymnasium.experimental.wrappers)": [[7, "gymnasium.experimental.wrappers.AtariPreprocessingV0"]], "autoresetv0 (class in gymnasium.experimental.wrappers)": [[7, "gymnasium.experimental.wrappers.AutoresetV0"]], "clipactionv0 (class in gymnasium.experimental.wrappers)": [[7, "gymnasium.experimental.wrappers.ClipActionV0"]], "cliprewardv0 (class in gymnasium.experimental.wrappers)": [[7, "gymnasium.experimental.wrappers.ClipRewardV0"]], "delayobservationv0 (class in gymnasium.experimental.wrappers)": [[7, "gymnasium.experimental.wrappers.DelayObservationV0"]], "dtypeobservationv0 (class in gymnasium.experimental.wrappers)": [[7, "gymnasium.experimental.wrappers.DtypeObservationV0"]], "filterobservationv0 (class in gymnasium.experimental.wrappers)": [[7, "gymnasium.experimental.wrappers.FilterObservationV0"]], "flattenobservationv0 (class in gymnasium.experimental.wrappers)": [[7, "gymnasium.experimental.wrappers.FlattenObservationV0"]], "framestackobservationv0 (class in gymnasium.experimental.wrappers)": [[7, "gymnasium.experimental.wrappers.FrameStackObservationV0"]], "grayscaleobservationv0 (class in gymnasium.experimental.wrappers)": [[7, "gymnasium.experimental.wrappers.GrayscaleObservationV0"]], "humanrenderingv0 (class in gymnasium.experimental.wrappers)": [[7, "gymnasium.experimental.wrappers.HumanRenderingV0"]], "jaxtonumpyv0 (class in gymnasium.experimental.wrappers)": [[7, "gymnasium.experimental.wrappers.JaxToNumpyV0"]], "jaxtotorchv0 (class in gymnasium.experimental.wrappers)": [[7, "gymnasium.experimental.wrappers.JaxToTorchV0"]], "lambdaactionv0 (class in gymnasium.experimental.wrappers)": [[7, "gymnasium.experimental.wrappers.LambdaActionV0"]], "lambdaobservationv0 (class in gymnasium.experimental.wrappers)": [[7, "gymnasium.experimental.wrappers.LambdaObservationV0"]], "lambdarewardv0 (class in gymnasium.experimental.wrappers)": [[7, "gymnasium.experimental.wrappers.LambdaRewardV0"]], "normalizeobservationv0 (class in gymnasium.experimental.wrappers)": [[7, "gymnasium.experimental.wrappers.NormalizeObservationV0"]], "normalizerewardv0 (class in gymnasium.experimental.wrappers)": [[7, "gymnasium.experimental.wrappers.NormalizeRewardV0"]], "numpytotorchv0 (class in gymnasium.experimental.wrappers)": [[7, "gymnasium.experimental.wrappers.NumpyToTorchV0"]], "orderenforcingv0 (class in gymnasium.experimental.wrappers)": [[7, "gymnasium.experimental.wrappers.OrderEnforcingV0"]], "passiveenvcheckerv0 (class in gymnasium.experimental.wrappers)": [[7, "gymnasium.experimental.wrappers.PassiveEnvCheckerV0"]], "pixelobservationv0 (class in gymnasium.experimental.wrappers)": [[7, "gymnasium.experimental.wrappers.PixelObservationV0"]], "recordepisodestatisticsv0 (class in gymnasium.experimental.wrappers)": [[7, "gymnasium.experimental.wrappers.RecordEpisodeStatisticsV0"]], "recordvideov0 (class in gymnasium.experimental.wrappers)": [[7, "gymnasium.experimental.wrappers.RecordVideoV0"]], "rendercollectionv0 (class in gymnasium.experimental.wrappers)": [[7, "gymnasium.experimental.wrappers.RenderCollectionV0"]], "rescaleactionv0 (class in gymnasium.experimental.wrappers)": [[7, "gymnasium.experimental.wrappers.RescaleActionV0"]], "rescaleobservationv0 (class in gymnasium.experimental.wrappers)": [[7, "gymnasium.experimental.wrappers.RescaleObservationV0"]], "reshapeobservationv0 (class in gymnasium.experimental.wrappers)": [[7, "gymnasium.experimental.wrappers.ReshapeObservationV0"]], "resizeobservationv0 (class in gymnasium.experimental.wrappers)": [[7, "gymnasium.experimental.wrappers.ResizeObservationV0"]], "stickyactionv0 (class in gymnasium.experimental.wrappers)": [[7, "gymnasium.experimental.wrappers.StickyActionV0"]], "timeawareobservationv0 (class in gymnasium.experimental.wrappers)": [[7, "gymnasium.experimental.wrappers.TimeAwareObservationV0"]], "make() (in module gymnasium)": [[8, "gymnasium.make"]], "pprint_registry() (in module gymnasium)": [[8, "gymnasium.pprint_registry"]], "register() (in module gymnasium)": [[8, "gymnasium.register"]], "spec() (in module gymnasium)": [[8, "gymnasium.spec"]], "space (class in gymnasium.spaces)": [[9, "gymnasium.spaces.Space"]], "contains() (in module gymnasium.spaces.space.space)": [[9, "gymnasium.spaces.space.Space.contains"]], "dtype (gymnasium.spaces.space property)": [[9, "gymnasium.spaces.Space.dtype"]], "from_jsonable() (in module gymnasium.spaces.space.space)": [[9, "gymnasium.spaces.space.Space.from_jsonable"]], "gymnasium.spaces": [[9, "module-gymnasium.spaces"]], "is_np_flattenable (gymnasium.spaces.space.space property)": [[9, "gymnasium.spaces.space.Space.is_np_flattenable"]], "module": [[9, "module-gymnasium.spaces"], [16, "module-gymnasium.wrappers"]], "sample() (in module gymnasium.spaces.space.space)": [[9, "gymnasium.spaces.space.Space.sample"]], "seed() (in module gymnasium.spaces.space.space)": [[9, "gymnasium.spaces.space.Space.seed"]], "shape (gymnasium.spaces.space.space property)": [[9, "gymnasium.spaces.space.Space.shape"]], "to_jsonable() (in module gymnasium.spaces.space.space)": [[9, "gymnasium.spaces.space.Space.to_jsonable"]], "dict (class in gymnasium.spaces)": [[10, "gymnasium.spaces.Dict"]], "graph (class in gymnasium.spaces)": [[10, "gymnasium.spaces.Graph"]], "sequence (class in gymnasium.spaces)": [[10, "gymnasium.spaces.Sequence"]], "tuple (class in gymnasium.spaces)": [[10, "gymnasium.spaces.Tuple"]], "sample() (gymnasium.spaces.dict method)": [[10, "gymnasium.spaces.Dict.sample"]], "sample() (gymnasium.spaces.graph method)": [[10, "gymnasium.spaces.Graph.sample"]], "sample() (gymnasium.spaces.sequence method)": [[10, "gymnasium.spaces.Sequence.sample"]], "sample() (gymnasium.spaces.tuple method)": [[10, "gymnasium.spaces.Tuple.sample"]], "seed() (gymnasium.spaces.dict method)": [[10, "gymnasium.spaces.Dict.seed"]], "seed() (gymnasium.spaces.graph method)": [[10, "gymnasium.spaces.Graph.seed"]], "seed() (gymnasium.spaces.sequence method)": [[10, "gymnasium.spaces.Sequence.seed"]], "seed() (gymnasium.spaces.tuple method)": [[10, "gymnasium.spaces.Tuple.seed"]], "box (class in gymnasium.spaces)": [[11, "gymnasium.spaces.Box"]], "discrete (class in gymnasium.spaces)": [[11, "gymnasium.spaces.Discrete"]], "multibinary (class in gymnasium.spaces)": [[11, "gymnasium.spaces.MultiBinary"]], "multidiscrete (class in gymnasium.spaces)": [[11, "gymnasium.spaces.MultiDiscrete"]], "text (class in gymnasium.spaces)": [[11, "gymnasium.spaces.Text"]], "is_bounded() (gymnasium.spaces.box method)": [[11, "gymnasium.spaces.Box.is_bounded"]], "sample() (gymnasium.spaces.box method)": [[11, "gymnasium.spaces.Box.sample"]], "sample() (gymnasium.spaces.discrete method)": [[11, "gymnasium.spaces.Discrete.sample"]], "sample() (gymnasium.spaces.multibinary method)": [[11, "gymnasium.spaces.MultiBinary.sample"]], "sample() (gymnasium.spaces.multidiscrete method)": [[11, "gymnasium.spaces.MultiDiscrete.sample"]], "sample() (gymnasium.spaces.text method)": [[11, "gymnasium.spaces.Text.sample"]], "seed() (gymnasium.spaces.box method)": [[11, "gymnasium.spaces.Box.seed"]], "seed() (gymnasium.spaces.discrete method)": [[11, "gymnasium.spaces.Discrete.seed"]], "seed() (gymnasium.spaces.multibinary method)": [[11, "gymnasium.spaces.MultiBinary.seed"]], "seed() (gymnasium.spaces.multidiscrete method)": [[11, "gymnasium.spaces.MultiDiscrete.seed"]], "seed() (gymnasium.spaces.text method)": [[11, "gymnasium.spaces.Text.seed"]], "flatdim() (in module gymnasium.spaces.utils)": [[12, "gymnasium.spaces.utils.flatdim"]], "flatten() (in module gymnasium.spaces.utils)": [[12, "gymnasium.spaces.utils.flatten"]], "flatten_space() (in module gymnasium.spaces.utils)": [[12, "gymnasium.spaces.utils.flatten_space"]], "unflatten() (in module gymnasium.spaces.utils)": [[12, "gymnasium.spaces.utils.unflatten"]], "batch_space() (in module gymnasium.vector.utils)": [[13, "gymnasium.vector.utils.batch_space"]], "concatenate() (in module gymnasium.vector.utils)": [[13, "gymnasium.vector.utils.concatenate"]], "create_empty_array() (in module gymnasium.vector.utils)": [[13, "gymnasium.vector.utils.create_empty_array"]], "create_shared_memory() (in module gymnasium.vector.utils)": [[13, "gymnasium.vector.utils.create_shared_memory"]], "iterate() (in module gymnasium.vector.utils)": [[13, "gymnasium.vector.utils.iterate"]], "read_from_shared_memory() (in module gymnasium.vector.utils)": [[13, "gymnasium.vector.utils.read_from_shared_memory"]], "write_to_shared_memory() (in module gymnasium.vector.utils)": [[13, "gymnasium.vector.utils.write_to_shared_memory"]], "playplot (class in gymnasium.utils.play)": [[14, "gymnasium.utils.play.PlayPlot"]], "playablegame (class in gymnasium.utils.play)": [[14, "gymnasium.utils.play.PlayableGame"]], "callback() (gymnasium.utils.play.playplot method)": [[14, "gymnasium.utils.play.PlayPlot.callback"]], "capped_cubic_video_schedule() (in module gymnasium.utils.save_video)": [[14, "gymnasium.utils.save_video.capped_cubic_video_schedule"]], "check_env() (in module gymnasium.utils.env_checker)": [[14, "gymnasium.utils.env_checker.check_env"]], "convert_to_done_step_api() (in module gymnasium.utils.step_api_compatibility)": [[14, "gymnasium.utils.step_api_compatibility.convert_to_done_step_api"]], "convert_to_terminated_truncated_step_api() (in module gymnasium.utils.step_api_compatibility)": [[14, "gymnasium.utils.step_api_compatibility.convert_to_terminated_truncated_step_api"]], "np_random() (in module gymnasium.utils.seeding)": [[14, "gymnasium.utils.seeding.np_random"]], "play() (in module gymnasium.utils.play)": [[14, "gymnasium.utils.play.play"]], "process_event() (gymnasium.utils.play.playablegame method)": [[14, "gymnasium.utils.play.PlayableGame.process_event"]], "save_video() (in module gymnasium.utils.save_video)": [[14, "gymnasium.utils.save_video.save_video"]], "step_api_compatibility() (in module gymnasium.utils.step_api_compatibility)": [[14, "gymnasium.utils.step_api_compatibility.step_api_compatibility"]], "asyncvectorenv (class in gymnasium.vector)": [[15, "gymnasium.vector.AsyncVectorEnv"]], "syncvectorenv (class in gymnasium.vector)": [[15, "gymnasium.vector.SyncVectorEnv"]], "vectorenv (class in gymnasium.vector)": [[15, "gymnasium.vector.VectorEnv"]], "action_space": [[15, "action_space"]], "close() (gymnasium.vector.vectorenv method)": [[15, "gymnasium.vector.VectorEnv.close"]], "make() (in module gymnasium.vector)": [[15, "gymnasium.vector.make"]], "observation_space": [[15, "observation_space"]], "reset() (gymnasium.vector.vectorenv method)": [[15, "gymnasium.vector.VectorEnv.reset"]], "single_action_space": [[15, "single_action_space"]], "single_observation_space": [[15, "single_observation_space"]], "step() (gymnasium.vector.vectorenv method)": [[15, "gymnasium.vector.VectorEnv.step"]], "wrapper (class in gymnasium)": [[16, "gymnasium.Wrapper"]], "action_space (gymnasium.wrapper property)": [[16, "gymnasium.Wrapper.action_space"]], "close() (in module gymnasium.wrapper)": [[16, "gymnasium.Wrapper.close"]], "env (gymnasium.wrappers.gymnasium.wrapper attribute)": [[16, "gymnasium.wrappers.gymnasium.Wrapper.env"]], "gymnasium.wrappers": [[16, "module-gymnasium.wrappers"]], "metadata (gymnasium.wrapper property)": [[16, "gymnasium.Wrapper.metadata"]], "np_random (gymnasium.wrapper property)": [[16, "gymnasium.Wrapper.np_random"]], "observation_space (gymnasium.wrapper property)": [[16, "gymnasium.Wrapper.observation_space"]], "reset() (in module gymnasium.wrapper)": [[16, "gymnasium.Wrapper.reset"]], "reward_range (gymnasium.wrapper property)": [[16, "gymnasium.Wrapper.reward_range"]], "spec (gymnasium.wrapper property)": [[16, "gymnasium.Wrapper.spec"]], "step() (in module gymnasium.wrapper)": [[16, "gymnasium.Wrapper.step"]], "unwrapped (gymnasium.wrapper property)": [[16, "gymnasium.Wrapper.unwrapped"]], "actionwrapper (class in gymnasium)": [[17, "gymnasium.ActionWrapper"]], "clipaction (class in gymnasium.wrappers)": [[17, "gymnasium.wrappers.ClipAction"]], "rescaleaction (class in gymnasium.wrappers)": [[17, "gymnasium.wrappers.RescaleAction"]], "action() (gymnasium.actionwrapper method)": [[17, "gymnasium.ActionWrapper.action"]], "ataripreprocessing (class in gymnasium.wrappers)": [[18, "gymnasium.wrappers.AtariPreprocessing"]], "autoresetwrapper (class in gymnasium.wrappers)": [[18, "gymnasium.wrappers.AutoResetWrapper"]], "envcompatibility (class in gymnasium.wrappers)": [[18, "gymnasium.wrappers.EnvCompatibility"]], "humanrendering (class in gymnasium.wrappers)": [[18, "gymnasium.wrappers.HumanRendering"]], "orderenforcing (class in gymnasium.wrappers)": [[18, "gymnasium.wrappers.OrderEnforcing"]], "passiveenvchecker (class in gymnasium.wrappers)": [[18, "gymnasium.wrappers.PassiveEnvChecker"]], "recordepisodestatistics (class in gymnasium.wrappers)": [[18, "gymnasium.wrappers.RecordEpisodeStatistics"]], "recordvideo (class in gymnasium.wrappers)": [[18, "gymnasium.wrappers.RecordVideo"]], "rendercollection (class in gymnasium.wrappers)": [[18, "gymnasium.wrappers.RenderCollection"]], "stepapicompatibility (class in gymnasium.wrappers)": [[18, "gymnasium.wrappers.StepAPICompatibility"]], "timelimit (class in gymnasium.wrappers)": [[18, "gymnasium.wrappers.TimeLimit"]], "vectorlistinfo (class in gymnasium.wrappers)": [[18, "gymnasium.wrappers.VectorListInfo"]], "filterobservation (class in gymnasium.wrappers)": [[19, "gymnasium.wrappers.FilterObservation"]], "flattenobservation (class in gymnasium.wrappers)": [[19, "gymnasium.wrappers.FlattenObservation"]], "framestack (class in gymnasium.wrappers)": [[19, "gymnasium.wrappers.FrameStack"]], "grayscaleobservation (class in gymnasium.wrappers)": [[19, "gymnasium.wrappers.GrayScaleObservation"]], "normalizeobservation (class in gymnasium.wrappers)": [[19, "gymnasium.wrappers.NormalizeObservation"]], "observationwrapper (class in gymnasium)": [[19, "gymnasium.ObservationWrapper"]], "pixelobservationwrapper (class in gymnasium.wrappers)": [[19, "gymnasium.wrappers.PixelObservationWrapper"]], "resizeobservation (class in gymnasium.wrappers)": [[19, "gymnasium.wrappers.ResizeObservation"]], "timeawareobservation (class in gymnasium.wrappers)": [[19, "gymnasium.wrappers.TimeAwareObservation"]], "transformobservation (class in gymnasium.wrappers)": [[19, "gymnasium.wrappers.TransformObservation"]], "observation() (gymnasium.observationwrapper method)": [[19, "gymnasium.ObservationWrapper.observation"]], "normalizereward (class in gymnasium.wrappers)": [[20, "gymnasium.wrappers.NormalizeReward"]], "rewardwrapper (class in gymnasium)": [[20, "gymnasium.RewardWrapper"]], "transformreward (class in gymnasium.wrappers)": [[20, "gymnasium.wrappers.TransformReward"]], "reward() (gymnasium.rewardwrapper method)": [[20, "gymnasium.RewardWrapper.reward"]]}}) |