diff --git a/main/environments/mujoco/index.html b/main/environments/mujoco/index.html index dd6f968a0..2a8345127 100644 --- a/main/environments/mujoco/index.html +++ b/main/environments/mujoco/index.html @@ -490,6 +490,18 @@ + +
+
+ +
+
+ Pusher +
+
+
+ +
diff --git a/main/searchindex.js b/main/searchindex.js index fa5419aaf..f0b5418d5 100644 --- a/main/searchindex.js +++ b/main/searchindex.js @@ -1 +1 @@ -Search.setIndex({"docnames": ["404", "README", "api/env", "api/experimental", "api/experimental/functional", "api/experimental/vector", "api/experimental/vector_wrappers", "api/experimental/wrappers", "api/registry", "api/spaces", "api/spaces/composite", "api/spaces/fundamental", "api/spaces/utils", "api/spaces/vector_utils", "api/utils", "api/vector", "api/wrappers", "api/wrappers/action_wrappers", "api/wrappers/misc_wrappers", "api/wrappers/observation_wrappers", "api/wrappers/reward_wrappers", "content/basic_usage", "content/gym_compatibility", "content/migration-guide", "environments/atari", "environments/atari/adventure", "environments/atari/air_raid", "environments/atari/alien", "environments/atari/amidar", "environments/atari/assault", "environments/atari/asterix", "environments/atari/asteroids", "environments/atari/atlantis", "environments/atari/bank_heist", "environments/atari/battle_zone", "environments/atari/beam_rider", "environments/atari/berzerk", "environments/atari/bowling", "environments/atari/boxing", "environments/atari/breakout", "environments/atari/carnival", "environments/atari/centipede", "environments/atari/chopper_command", "environments/atari/complete_list", "environments/atari/crazy_climber", "environments/atari/defender", "environments/atari/demon_attack", "environments/atari/double_dunk", "environments/atari/elevator_action", "environments/atari/enduro", "environments/atari/fishing_derby", "environments/atari/freeway", "environments/atari/frostbite", "environments/atari/gopher", "environments/atari/gravitar", "environments/atari/hero", "environments/atari/ice_hockey", "environments/atari/jamesbond", "environments/atari/journey_escape", "environments/atari/kangaroo", "environments/atari/krull", "environments/atari/kung_fu_master", "environments/atari/montezuma_revenge", "environments/atari/ms_pacman", "environments/atari/name_this_game", "environments/atari/phoenix", "environments/atari/pitfall", "environments/atari/pong", "environments/atari/pooyan", "environments/atari/private_eye", "environments/atari/qbert", "environments/atari/riverraid", "environments/atari/road_runner", "environments/atari/robotank", "environments/atari/seaquest", "environments/atari/skiing", "environments/atari/solaris", "environments/atari/space_invaders", "environments/atari/star_gunner", "environments/atari/tennis", "environments/atari/time_pilot", "environments/atari/tutankham", "environments/atari/up_n_down", "environments/atari/venture", "environments/atari/video_pinball", "environments/atari/wizard_of_wor", "environments/atari/zaxxon", "environments/box2d", "environments/box2d/bipedal_walker", "environments/box2d/car_racing", "environments/box2d/lunar_lander", "environments/classic_control", "environments/classic_control/acrobot", "environments/classic_control/cart_pole", "environments/classic_control/mountain_car", "environments/classic_control/mountain_car_continuous", "environments/classic_control/pendulum", "environments/mujoco", "environments/mujoco/ant", "environments/mujoco/half_cheetah", "environments/mujoco/hopper", "environments/mujoco/humanoid", "environments/mujoco/humanoid_standup", "environments/mujoco/inverted_double_pendulum", "environments/mujoco/inverted_pendulum", "environments/mujoco/pusher", "environments/mujoco/reacher", "environments/mujoco/swimmer", "environments/mujoco/walker2d", "environments/third_party_environments", "environments/toy_text", "environments/toy_text/blackjack", "environments/toy_text/cliff_walking", "environments/toy_text/frozen_lake", "environments/toy_text/taxi", "index", "tutorials/blackjack_tutorial", "tutorials/environment_creation", "tutorials/handling_time_limits", "tutorials/reinforce_invpend_gym_v26"], "filenames": ["404.md", "README.md", "api/env.md", "api/experimental.md", "api/experimental/functional.md", "api/experimental/vector.md", "api/experimental/vector_wrappers.md", "api/experimental/wrappers.md", "api/registry.md", "api/spaces.md", "api/spaces/composite.md", "api/spaces/fundamental.md", "api/spaces/utils.md", "api/spaces/vector_utils.md", "api/utils.md", "api/vector.md", "api/wrappers.md", "api/wrappers/action_wrappers.md", "api/wrappers/misc_wrappers.md", "api/wrappers/observation_wrappers.md", "api/wrappers/reward_wrappers.md", "content/basic_usage.md", "content/gym_compatibility.md", "content/migration-guide.md", "environments/atari.md", "environments/atari/adventure.md", "environments/atari/air_raid.md", "environments/atari/alien.md", "environments/atari/amidar.md", "environments/atari/assault.md", "environments/atari/asterix.md", "environments/atari/asteroids.md", "environments/atari/atlantis.md", "environments/atari/bank_heist.md", "environments/atari/battle_zone.md", "environments/atari/beam_rider.md", "environments/atari/berzerk.md", "environments/atari/bowling.md", "environments/atari/boxing.md", "environments/atari/breakout.md", "environments/atari/carnival.md", "environments/atari/centipede.md", "environments/atari/chopper_command.md", "environments/atari/complete_list.md", "environments/atari/crazy_climber.md", "environments/atari/defender.md", "environments/atari/demon_attack.md", "environments/atari/double_dunk.md", "environments/atari/elevator_action.md", "environments/atari/enduro.md", "environments/atari/fishing_derby.md", "environments/atari/freeway.md", "environments/atari/frostbite.md", "environments/atari/gopher.md", "environments/atari/gravitar.md", "environments/atari/hero.md", "environments/atari/ice_hockey.md", "environments/atari/jamesbond.md", "environments/atari/journey_escape.md", "environments/atari/kangaroo.md", "environments/atari/krull.md", "environments/atari/kung_fu_master.md", "environments/atari/montezuma_revenge.md", "environments/atari/ms_pacman.md", "environments/atari/name_this_game.md", "environments/atari/phoenix.md", "environments/atari/pitfall.md", "environments/atari/pong.md", "environments/atari/pooyan.md", "environments/atari/private_eye.md", "environments/atari/qbert.md", "environments/atari/riverraid.md", "environments/atari/road_runner.md", "environments/atari/robotank.md", "environments/atari/seaquest.md", "environments/atari/skiing.md", "environments/atari/solaris.md", "environments/atari/space_invaders.md", "environments/atari/star_gunner.md", "environments/atari/tennis.md", "environments/atari/time_pilot.md", "environments/atari/tutankham.md", "environments/atari/up_n_down.md", "environments/atari/venture.md", "environments/atari/video_pinball.md", "environments/atari/wizard_of_wor.md", "environments/atari/zaxxon.md", "environments/box2d.md", "environments/box2d/bipedal_walker.md", "environments/box2d/car_racing.md", "environments/box2d/lunar_lander.md", "environments/classic_control.md", "environments/classic_control/acrobot.md", "environments/classic_control/cart_pole.md", "environments/classic_control/mountain_car.md", "environments/classic_control/mountain_car_continuous.md", "environments/classic_control/pendulum.md", "environments/mujoco.md", "environments/mujoco/ant.md", "environments/mujoco/half_cheetah.md", "environments/mujoco/hopper.md", "environments/mujoco/humanoid.md", "environments/mujoco/humanoid_standup.md", "environments/mujoco/inverted_double_pendulum.md", "environments/mujoco/inverted_pendulum.md", "environments/mujoco/pusher.md", "environments/mujoco/reacher.md", "environments/mujoco/swimmer.md", "environments/mujoco/walker2d.md", "environments/third_party_environments.md", "environments/toy_text.md", "environments/toy_text/blackjack.md", "environments/toy_text/cliff_walking.md", "environments/toy_text/frozen_lake.md", "environments/toy_text/taxi.md", "index.md", "tutorials/blackjack_tutorial.rst", "tutorials/environment_creation.rst", "tutorials/handling_time_limits.rst", "tutorials/reinforce_invpend_gym_v26.rst"], "titles": ["404 - Page Not Found", "Gymnasium-docs", "Env", "Experimental", "Functional Environment", "Vectorizing Environment", "Vector Environment Wrappers", "Wrappers", "Registry", "Spaces", "Composite Spaces", "Fundamental Spaces", "Spaces Utils", "Spaces Vector Utils", "Utils", "Vector", "Wrappers", "Action Wrappers", "Misc Wrappers", "Observation Wrappers", "Reward Wrappers", "Basic Usage", "Compatibility with Gym", "v21 to v26 Migration Guide", "Atari", "Adventure", "Air Raid", "Alien", "Amidar", "Assault", "Asterix", "Asteroids", "Atlantis", "Bank Heist", "Battle Zone", "Beam Rider", "Berzerk", "Bowling", "Boxing", "Breakout", "Carnival", "Centipede", "Chopper Command", "Complete List - Atari", "Crazy Climber", "Defender", "Demon Attack", "Double Dunk", "Elevator Action", "Enduro", "FishingDerby", "Freeway", "Frostbite", "Gopher", "Gravitar", "Hero", "IceHockey", "Jamesbond", "JourneyEscape", "Kangaroo", "Krull", "Kung Fu Master", "Montezuma Revenge", "Ms Pacman", "Name This Game", "Phoenix", "Pitfall", "Pong", "Pooyan", "PrivateEye", "Qbert", "Riverraid", "Road Runner", "Robot Tank", "Seaquest", "Skiings", "Solaris", "SpaceInvaders", "StarGunner", "Tennis", "TimePilot", "Tutankham", "Up n\u2019 Down", "Venture", "Video Pinball", "Wizard of Wor", "Zaxxon", "Box2D", "Bipedal Walker", "Car Racing", "Lunar Lander", "Classic Control", "Acrobot", "Cart Pole", "Mountain Car", "Mountain Car Continuous", "Pendulum", "MuJoCo", "Ant", "Half Cheetah", "Hopper", "Humanoid", "Humanoid Standup", "Inverted Double Pendulum", "Inverted Pendulum", "Pusher", "Reacher", "Swimmer", "Walker2D", "Third-party Environments", "Toy Text", "Blackjack", "Cliff Walking", "Frozen Lake", "Taxi", "Gymnasium is a standard API for reinforcement learning, and a diverse collection of reference environments", "Solving Blackjack with Q-Learning", "Make your own custom environment", "Handling Time Limits", "Training using REINFORCE for Mujoco"], "terms": {"thi": [1, 2, 3, 4, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 111, 112, 113, 114, 115, 116, 117, 118, 119], "folder": [1, 14, 18, 105, 106], "contain": [1, 2, 3, 9, 12, 13, 15, 16, 18, 19, 21, 23, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 98, 99, 100, 101, 105, 106, 107, 108, 109, 111, 114, 116, 117, 119], "If": [1, 2, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 24, 30, 33, 38, 41, 50, 51, 52, 53, 54, 68, 75, 79, 88, 89, 90, 95, 98, 100, 101, 102, 106, 108, 111, 112, 113, 116, 117], "you": [1, 2, 9, 10, 11, 12, 14, 15, 16, 17, 18, 19, 20, 21, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 89, 90, 98, 101, 102, 105, 106, 109, 115, 117, 118], "ar": [1, 2, 3, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 116, 117, 118, 119], "pleas": [1, 2, 14, 23, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 89, 90, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 112, 113, 114], "pr": [1, 23, 109], "repo": [1, 24], "otherwis": [1, 2, 8, 10, 11, 14, 15, 18, 19, 24, 37, 109, 116], "follow": [1, 4, 8, 9, 14, 16, 17, 18, 20, 21, 24, 37, 47, 49, 50, 51, 52, 53, 54, 79, 92, 93, 94, 95, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 111, 112, 113, 114, 116, 117, 118, 119], "below": [1, 11, 16, 21, 50, 88, 90, 96, 105, 108, 116, 118], "directli": [1, 10, 16, 18, 21, 92, 109, 116, 117, 119], "markdown": 1, "file": [1, 92, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 117], "repositori": [1, 16, 97], "fork": [1, 23, 109, 115], "docstr": 1, "": [1, 2, 4, 10, 11, 14, 15, 16, 17, 18, 19, 20, 21, 24, 44, 50, 51, 52, 53, 54, 56, 57, 60, 61, 62, 67, 68, 70, 87, 88, 89, 90, 91, 92, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119], "python": [1, 8, 13, 18, 21, 88, 89, 90, 115, 116, 117, 118, 119], "Then": [1, 16, 17, 21, 74, 107], "pip": [1, 24, 87, 91, 97, 117], "instal": [1, 14, 18, 32, 87, 91, 97, 117], "your": [1, 2, 15, 16, 17, 18, 19, 20, 21, 27, 28, 30, 32, 33, 35, 37, 38, 39, 41, 47, 49, 50, 51, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 67, 69, 70, 71, 72, 73, 74, 75, 76, 77, 80, 81, 82, 83, 84, 85, 86, 89, 98, 101, 102, 115, 116], "run": [1, 2, 8, 15, 18, 33, 55, 58, 66, 71, 72, 75, 76, 88, 90, 92, 98, 99, 100, 101, 102, 103, 104, 107, 108, 109, 112, 117], "script": [1, 116], "gen_md": 1, "py": [1, 13, 24, 88, 89, 90, 97, 98, 101, 102, 112, 116, 117, 118, 119], "automat": [1, 2, 8, 15, 16, 18, 22, 23, 117], "gener": [1, 2, 9, 10, 11, 14, 15, 16, 18, 19, 21, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 89, 90, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 111, 112, 113, 114, 115, 117], "For": [1, 2, 4, 11, 12, 14, 16, 18, 19, 21, 22, 23, 24, 25, 27, 28, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 45, 55, 56, 57, 58, 59, 60, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 89, 90, 97, 112, 113, 114, 116, 117], "add": [1, 8, 14, 15, 19, 21, 89, 97, 101, 102, 114, 116, 117], "complet": [1, 16, 18, 21, 23, 24, 44, 57, 69, 70, 89, 90, 116, 118], "ensur": [1, 2, 8, 10, 12, 14, 21, 116, 117], "i": [1, 2, 3, 4, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 89, 90, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 111, 112, 113, 114, 116, 117, 118, 119], "ha": [1, 2, 3, 9, 11, 12, 14, 16, 18, 19, 20, 21, 23, 24, 54, 74, 88, 89, 90, 91, 97, 98, 99, 100, 101, 102, 105, 106, 107, 108, 109, 111, 115, 116, 117, 118, 119], "properli": [1, 9], "format": [1, 9, 14, 16, 18, 19, 21], "md": [1, 117], "correspond": [1, 2, 8, 23, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 90, 92, 93, 94, 95, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 114, 117, 119], "gif": [1, 92], "_static": 1, "video": [1, 16, 43, 73, 88], "env_typ": 1, "where": [1, 3, 7, 8, 10, 11, 12, 14, 16, 18, 19, 21, 23, 24, 47, 89, 92, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 112, 113, 114, 115, 116, 117, 118, 119], "categori": 1, "e": [1, 2, 3, 9, 11, 12, 13, 15, 16, 18, 19, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 105, 106, 109, 111, 113, 116, 117, 119], "g": [1, 2, 9, 11, 12, 13, 15, 16, 75, 92, 96, 109, 113, 114, 116, 117, 119], "mujoco": [1, 16, 21, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108], "snake_cas": 1, "name": [1, 3, 4, 8, 16, 43, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 117], "convent": [1, 2, 24], "altern": [1, 24], "gen_gif": 1, "index": [1, 13, 14, 18, 19, 21, 24, 93, 102], "toctre": 1, "requir": [1, 2, 9, 19, 97, 116, 119], "packag": [1, 18, 109], "cd": [1, 117], "r": [1, 7, 11, 18, 20, 73, 92, 96, 109, 111, 112, 114, 119], "txt": 1, "To": [1, 8, 13, 15, 18, 19, 20, 21, 22, 23, 24, 32, 42, 70, 88, 89, 90, 92, 114, 116, 117, 119], "builder": 1, "onc": [1, 18, 31, 41, 48, 55, 103, 106, 114, 116, 117], "make": [1, 2, 7, 10, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 89, 90, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 112, 113, 114, 115, 116, 119], "dirhtml": 1, "_build": 1, "rebuild": [1, 32], "everi": [1, 14, 18, 21, 41, 42, 46, 51, 73, 74, 83, 89, 90, 93, 98, 100, 101, 108, 109, 117, 119], "time": [1, 2, 8, 10, 14, 15, 16, 24, 40, 43, 46, 47, 48, 52, 56, 58, 59, 66, 70, 71, 72, 73, 74, 75, 88, 89, 96, 98, 99, 100, 101, 102, 107, 108, 109, 112, 114, 116, 117, 119], "chang": [1, 2, 3, 4, 13, 14, 15, 16, 18, 19, 20, 21, 22, 23, 24, 52, 60, 70, 89, 92, 93, 94, 95, 96, 97, 105, 106, 109, 114, 116, 117, 119], "made": [1, 3, 105, 106], "sphinx": 1, "autobuild": 1, "b": [1, 11, 105, 106, 114], "we": [1, 2, 3, 4, 11, 18, 19, 20, 21, 23, 24, 98, 101, 102, 116, 117, 118, 119], "us": [1, 2, 3, 4, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 113, 114, 116, 118], "galleri": 1, "insid": [1, 10, 11, 18, 117], "directori": 1, "check": [1, 2, 11, 18, 114, 116, 117], "demo": 1, "see": [1, 2, 9, 14, 15, 21, 23, 24, 25, 28, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 45, 55, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 90, 92, 98, 99, 100, 101, 107, 108, 109, 113, 117], "exampl": [1, 2, 7, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 89, 92, 111, 112, 113, 116, 117, 118], "more": [1, 2, 3, 9, 10, 11, 14, 15, 16, 19, 23, 24, 25, 28, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 45, 50, 55, 56, 57, 58, 59, 60, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 88, 90, 97, 98, 101, 102, 103, 104, 105, 106, 107, 109, 116, 117, 118, 119], "inform": [1, 2, 9, 10, 11, 14, 15, 16, 18, 19, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 89, 90, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 116, 117, 118, 119], "convert": [1, 8, 9, 10, 16, 18, 19, 22, 23, 89, 116], "jupyt": [1, 116, 117, 118, 119], "notebook": [1, 116, 117, 118, 119], "can": [1, 2, 3, 8, 9, 10, 11, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 111, 112, 113, 114, 117, 119], "want": [1, 2, 10, 15, 16, 17, 18, 20, 21, 33, 55, 116, 117], "execut": [1, 14, 17, 24, 47, 114, 117, 119], "which": [1, 2, 8, 9, 10, 12, 13, 14, 15, 16, 18, 19, 20, 21, 22, 23, 24, 44, 46, 48, 62, 89, 90, 92, 93, 97, 98, 99, 100, 101, 102, 103, 105, 106, 107, 108, 109, 112, 113, 114, 117, 118, 119], "output": [1, 13, 14, 18, 21, 116, 119], "plot": [1, 14, 116], "should": [1, 2, 9, 11, 14, 15, 18, 19, 21, 23, 105, 106, 116, 117], "start": [1, 2, 9, 11, 14, 15, 18, 34, 47, 48, 54, 58, 59, 74, 116, 119], "run_": 1, "note": [1, 9, 13, 18, 92, 93, 98, 101, 102, 114, 116, 118, 119], "so": [1, 14, 15, 16, 18, 19, 21, 24, 52, 75, 90, 91, 98, 99, 100, 101, 102, 103, 104, 107, 108, 109, 113, 116, 117, 118], "sure": [1, 2, 18, 117], "doesn": [1, 2, 8, 16, 18, 24, 90, 118], "t": [1, 2, 8, 10, 12, 14, 16, 18, 19, 20, 23, 24, 40, 50, 51, 52, 53, 54, 73, 74, 89, 90, 94, 95, 114, 116, 117, 118], "take": [1, 2, 4, 7, 8, 11, 12, 14, 15, 16, 17, 18, 21, 23, 24, 77, 91, 93, 95, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 114, 116, 119], "than": [1, 23, 50, 56, 74, 90, 92, 93, 94, 95, 99, 103, 104, 105, 107, 109, 111, 116], "few": [1, 92, 116], "second": [1, 10, 14, 15, 37, 68, 75, 90, 99, 103, 106, 107], "class": [2, 3, 4, 7, 9, 10, 11, 14, 15, 16, 17, 18, 19, 20, 21, 97, 116, 117, 119], "The": [2, 3, 4, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 111, 112, 113, 114, 115, 116, 117, 118, 119], "main": [2, 90, 100, 108], "reinforc": [2, 9, 21, 92, 107, 110, 111, 112, 114, 116, 118], "learn": [2, 9, 10, 18, 19, 20, 21, 24, 50, 51, 52, 53, 54, 88, 89, 90, 92, 93, 94, 95, 99, 102, 103, 104, 107, 110, 111, 112, 114, 117], "agent": [2, 3, 9, 16, 18, 19, 21, 23, 24, 48, 57, 88, 89, 90, 94, 98, 99, 100, 101, 102, 103, 104, 107, 108, 117, 118], "encapsul": 2, "an": [2, 4, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 90, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 105, 106, 107, 108, 109, 111, 112, 113, 114, 117, 118], "arbitrari": [2, 8, 11, 14, 19, 20, 109], "behind": [2, 68], "scene": [2, 68, 109], "dynam": [2, 24, 39, 50, 51, 52, 53, 54, 92, 96, 97, 103], "through": [2, 8, 9, 15, 22, 23, 24, 39, 55, 58, 61, 62, 66, 75, 76, 101, 102, 118], "step": [2, 7, 8, 15, 16, 17, 18, 19, 20, 21, 24, 88, 90, 92, 93, 96, 112, 113, 114, 115, 116, 118, 119], "reset": [2, 7, 8, 14, 15, 16, 18, 19, 20, 21, 92, 93, 94, 95, 96, 109, 112, 113, 114, 115, 116, 119], "function": [2, 7, 8, 9, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 90, 96, 106, 109, 113, 114, 116, 118, 119], "partial": 2, "fulli": 2, "observ": [2, 4, 9, 10, 13, 14, 15, 16, 17, 18, 20, 23, 109, 115, 118, 119], "singl": [2, 4, 9, 10, 11, 12, 13, 14, 15, 19, 21, 100, 101, 102, 108, 117, 119], "multi": [2, 11, 97, 101, 102, 105], "pettingzoo": 2, "api": [2, 4, 16, 18, 21, 23, 117, 118], "user": [2, 4, 8, 15, 21, 23, 24, 92, 93, 94, 95, 96, 109, 117, 119], "need": [2, 8, 9, 10, 14, 16, 17, 18, 19, 21, 23, 42, 44, 49, 55, 59, 69, 74, 88, 90, 93, 97, 116, 117, 118], "know": [2, 18, 21, 117], "updat": [2, 14, 18, 19, 21, 22, 23, 114, 116, 117, 118, 119], "action": [2, 4, 8, 9, 10, 11, 14, 15, 16, 18, 23, 43, 91, 109, 110, 115, 117, 119], "return": [2, 4, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 98, 99, 100, 101, 102, 103, 105, 106, 107, 108, 111, 112, 113, 114, 116, 117, 118, 119], "next": [2, 4, 13, 21, 23, 44, 46, 48, 119], "reward": [2, 4, 8, 14, 15, 16, 18, 21, 23, 97, 109, 115, 116, 117, 118, 119], "termin": [2, 4, 8, 14, 15, 16, 18, 20, 21, 22, 23, 92, 93, 94, 95, 98, 100, 101, 102, 103, 104, 105, 106, 108, 111, 112, 113, 114, 115, 116, 117, 119], "truncat": [2, 8, 14, 15, 16, 18, 20, 21, 22, 23, 92, 93, 94, 95, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 113, 114, 115, 116, 117, 119], "due": [2, 23, 113, 118], "latest": [2, 119], "from": [2, 3, 4, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 23, 24, 26, 40, 47, 52, 53, 56, 58, 67, 68, 80, 86, 88, 89, 90, 92, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 111, 112, 113, 114, 116, 118, 119], "about": [2, 4, 14, 19, 21, 69, 92, 98, 101, 102, 116, 117, 118, 119], "metric": [2, 14, 23], "debug": [2, 9, 14, 110], "info": [2, 4, 14, 15, 16, 19, 20, 21, 23, 98, 99, 100, 101, 105, 106, 107, 108, 114, 115, 116, 117, 118, 119], "initi": [2, 4, 7, 8, 10, 11, 15, 16, 17, 18, 19, 20, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 90, 91, 92, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 111, 112, 113, 114, 116, 119], "state": [2, 4, 16, 18, 19, 21, 23, 24, 91, 97, 109, 110, 116, 118, 119], "befor": [2, 8, 14, 15, 16, 17, 18, 19, 20, 32, 44, 58, 69, 76, 77, 89, 98, 99, 100, 101, 102, 103, 104, 106, 107, 108, 117, 119], "call": [2, 3, 8, 12, 14, 15, 16, 17, 18, 19, 21, 22, 23, 24, 37, 56, 105, 106, 111, 113, 116, 117], "first": [2, 14, 15, 16, 18, 19, 21, 23, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 89, 90, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 111, 112, 113, 114, 116, 117, 119], "episod": [2, 8, 14, 16, 19, 23, 116, 117, 118, 119], "render": [2, 4, 15, 16, 19, 21, 24, 87, 88, 98, 99, 100, 101, 102, 103, 104, 107, 108, 109, 116], "help": [2, 9, 21, 27, 59, 62, 105, 116], "visualis": [2, 21], "what": [2, 9, 18, 24, 112], "mode": [2, 15, 16, 18, 21, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 116, 117], "human": [2, 10, 16, 21, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 89, 101, 102, 105, 115, 117], "rgb_arrai": [2, 14, 16, 18, 19, 24, 117], "ansi": [2, 117], "text": [2, 9, 10, 12, 21, 111, 112, 113, 114], "close": [2, 4, 11, 14, 15, 16, 21, 23, 44, 69, 98, 100, 101, 106, 108, 115, 116], "import": [2, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 89, 90, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 112, 113, 114, 115, 117, 119], "when": [2, 9, 10, 12, 13, 14, 15, 16, 18, 19, 20, 22, 24, 27, 40, 44, 45, 46, 48, 50, 51, 52, 53, 54, 56, 57, 71, 72, 73, 74, 77, 89, 90, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 112, 113, 114, 117, 118, 119], "extern": [2, 23, 98, 101, 102, 118], "softwar": [2, 109], "pygam": [2, 14, 23, 87, 117], "databas": 2, "have": [2, 8, 11, 12, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 27, 30, 32, 33, 37, 39, 41, 42, 44, 45, 50, 51, 52, 53, 54, 55, 58, 59, 60, 64, 66, 68, 74, 76, 87, 88, 89, 92, 98, 99, 100, 101, 102, 104, 105, 107, 108, 109, 111, 113, 114, 116, 117, 118, 119], "understand": [2, 12, 15, 105, 109, 119], "action_spac": [2, 14, 15, 16, 17, 19, 20, 21, 23, 114, 115, 116, 117, 119], "space": [2, 3, 14, 15, 16, 17, 18, 19, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 97, 109, 110, 117, 119], "object": [2, 9, 13, 16, 21, 25, 30, 44, 50, 51, 59, 71, 77, 105, 116, 119], "valid": [2, 8, 9, 11, 13, 15, 16, 17, 18, 21, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 116], "all": [2, 3, 10, 11, 15, 16, 18, 21, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 51, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 89, 90, 91, 92, 93, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 111, 112, 113, 116, 119], "within": [2, 9, 17, 19, 21, 23, 62, 66, 90, 91, 103, 104], "observation_spac": [2, 10, 11, 15, 16, 19, 21, 117, 119], "reward_rang": [2, 16, 20], "A": [2, 4, 7, 9, 10, 11, 12, 14, 15, 17, 18, 19, 20, 22, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 89, 92, 93, 95, 98, 99, 100, 101, 102, 103, 105, 106, 107, 108, 111, 112, 113, 116, 117, 118, 119], "tupl": [2, 4, 9, 11, 12, 13, 14, 16, 19, 21, 23, 24, 98, 100, 101, 108, 111, 116, 117, 119], "minimum": [2, 11, 96], "maximum": [2, 8, 11, 14, 18, 21, 73, 74, 90, 92, 96, 103, 117], "possibl": [2, 10, 11, 12, 21, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 90, 92, 93, 94, 95, 99, 101, 103, 104, 107, 108, 109, 112, 113, 114, 116, 117], "over": [2, 13, 18, 20, 27, 33, 56, 66, 71, 99, 101, 111, 113, 116], "default": [2, 8, 9, 10, 11, 14, 15, 16, 18, 19, 21, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 89, 92, 96, 98, 99, 100, 101, 105, 106, 107, 108, 117, 118], "rang": [2, 13, 14, 16, 17, 18, 20, 21, 22, 23, 24, 56, 88, 91, 92, 93, 94, 95, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 112, 113, 114, 115, 116, 117, 119], "set": [2, 10, 11, 15, 16, 17, 18, 19, 23, 24, 25, 26, 27, 28, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 82, 83, 84, 85, 87, 90, 91, 92, 94, 95, 97, 98, 99, 100, 101, 105, 106, 107, 108, 109, 113, 116, 117, 118, 119], "infti": [2, 11], "spec": [2, 15, 16, 18], "metadata": [2, 14, 16, 18, 24, 117], "fp": [2, 14, 24, 117], "np_random": [2, 14, 16, 18, 23, 117], "random": [2, 9, 10, 11, 14, 18, 19, 21, 24, 89, 90, 92, 93, 94, 95, 96, 98, 99, 100, 101, 106, 107, 108, 109, 113, 114, 116, 117, 119], "number": [2, 3, 8, 9, 10, 11, 12, 13, 14, 15, 16, 18, 19, 21, 22, 24, 26, 27, 28, 29, 30, 31, 32, 35, 36, 37, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 58, 61, 63, 64, 65, 67, 68, 70, 73, 75, 77, 78, 80, 81, 82, 84, 85, 89, 90, 92, 100, 101, 102, 107, 108, 109, 111, 113, 117, 119], "assign": [2, 75, 93, 94, 95, 105, 106], "dure": [2, 10, 11, 15, 16, 18, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 92, 98, 99, 100, 101, 107, 108, 114, 117], "super": [2, 16, 17, 19, 20, 23, 117, 119], "seed": [2, 8, 9, 10, 11, 15, 16, 21, 72, 115, 117, 119], "assess": 2, "self": [2, 4, 9, 10, 16, 17, 18, 19, 20, 95, 109, 116, 117, 119], "modifi": [2, 7, 9, 15, 16, 17, 19, 20, 23, 92, 105, 106, 114, 117], "extend": 2, "wrapper": [2, 8, 10, 11, 14, 15, 21, 22, 23, 105, 106, 109, 113, 114, 115, 116, 119], "acttyp": [2, 4, 14, 16, 17, 19, 20], "obstyp": [2, 4, 14, 16, 17, 19, 20, 23, 119], "supportsfloat": [2, 8, 11, 16, 20, 23, 119], "bool": [2, 8, 9, 11, 14, 15, 16, 18, 19, 23, 24, 90, 98, 99, 100, 101, 107, 108, 116, 117, 119], "dict": [2, 4, 8, 9, 11, 12, 13, 14, 15, 16, 18, 19, 21, 23, 112, 113, 114, 117, 119], "str": [2, 4, 8, 9, 10, 11, 12, 14, 15, 16, 18, 19, 23, 24, 98, 99, 100, 101, 107, 108, 116, 119], "ani": [2, 4, 7, 8, 9, 10, 11, 12, 13, 14, 16, 18, 19, 23, 24, 46, 50, 51, 52, 53, 54, 55, 73, 90, 93, 98, 100, 101, 102, 103, 104, 105, 106, 107, 108, 113, 116, 117, 118, 119], "one": [2, 10, 11, 12, 14, 15, 16, 18, 19, 21, 22, 23, 26, 27, 28, 32, 37, 44, 47, 48, 60, 69, 70, 71, 73, 74, 79, 92, 93, 94, 95, 96, 98, 100, 102, 103, 104, 106, 107, 111, 114, 116, 118, 119], "timestep": [2, 18, 19, 21, 94, 95, 98, 100, 101, 102, 103, 104, 105, 106, 108, 117, 119], "end": [2, 4, 16, 18, 21, 32, 41, 42, 44, 46, 48, 49, 57, 58, 59, 69, 73, 76, 77, 88, 96, 116, 118, 119], "reach": [2, 16, 32, 34, 44, 47, 48, 65, 68, 76, 77, 91, 92, 93, 94, 95, 98, 100, 101, 102, 103, 104, 105, 106, 108, 112, 113, 114, 116, 117, 118, 119], "necessari": [2, 9, 24, 50, 51, 52, 53, 54], "version": [2, 3, 8, 9, 16, 93, 116, 117, 118], "0": [2, 7, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 89, 90, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 112, 113, 114, 116, 117, 118, 119], "26": [2, 22, 98, 101, 102, 117, 118, 119], "wa": [2, 14, 15, 16, 19, 20, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 98, 99, 100, 101, 107, 108, 118, 119], "remov": [2, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 92, 114], "done": [2, 8, 14, 16, 18, 21, 22, 23, 98, 100, 101, 102, 103, 104, 108, 116, 117, 118, 119], "favor": 2, "clearer": 2, "had": 2, "critic": [2, 18], "bootstrap": [2, 23, 118], "algorithm": [2, 9, 97, 110, 114, 116, 118, 119], "paramet": [2, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 23, 90, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 107, 108, 117, 119], "provid": [2, 3, 7, 9, 10, 11, 14, 15, 16, 17, 18, 19, 21, 22, 24, 30, 44, 46, 50, 51, 52, 53, 54, 88, 92, 109, 117], "element": [2, 9, 10, 11, 13, 15, 19, 21, 93, 94, 95, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 117], "numpi": [2, 3, 4, 9, 11, 13, 15, 16, 17, 19, 23, 109, 116, 117, 119], "arrai": [2, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 90, 109, 116, 117, 119], "posit": [2, 10, 11, 12, 13, 14, 18, 19, 21, 24, 35, 56, 88, 89, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 112, 113, 114, 116, 117], "veloc": [2, 10, 12, 13, 88, 90, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108], "pole": [2, 75, 91, 103, 104, 109, 119], "cartpol": [2, 7, 8, 14, 15, 18, 19, 20, 21, 91, 93, 103, 104, 109, 119], "result": [2, 3, 12, 14, 15, 21, 92, 98, 101, 102, 110, 112, 114, 116], "whether": [2, 4, 8, 11, 14, 18, 23, 37, 90, 98, 99, 100, 101, 107, 108, 111, 116, 117, 118, 119], "defin": [2, 4, 9, 12, 16, 17, 18, 19, 20, 21, 96, 101, 117, 118], "under": [2, 19, 20, 116, 119], "mdp": [2, 18, 21, 94, 95], "task": [2, 10, 16, 19, 21, 60, 66, 69, 89, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 114, 117, 118, 119], "neg": [2, 11, 14, 21, 75, 95, 98, 99, 101, 102, 103, 105, 106, 114, 119], "goal": [2, 27, 30, 35, 37, 39, 41, 44, 56, 61, 62, 63, 64, 65, 67, 70, 72, 74, 75, 81, 82, 83, 84, 85, 86, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 111, 112, 113, 114, 117, 119], "move": [2, 3, 16, 20, 21, 23, 26, 29, 30, 39, 40, 54, 57, 68, 71, 74, 75, 88, 90, 93, 98, 99, 100, 102, 103, 104, 105, 106, 107, 108, 109, 112, 113, 114, 117, 118, 119], "lava": [2, 21, 55], "sutton": [2, 92, 93, 103, 104, 111, 112, 116], "barton": 2, "gridworld": [2, 109, 112, 117], "true": [2, 8, 12, 14, 15, 17, 18, 19, 21, 22, 24, 50, 51, 52, 53, 54, 88, 89, 90, 98, 99, 100, 101, 107, 108, 111, 113, 116, 117, 119], "condit": [2, 116, 118, 119], "outsid": [2, 89, 90, 118], "scope": [2, 118], "satisfi": 2, "typic": [2, 14, 114], "timelimit": [2, 8, 16, 18, 21, 117, 118], "could": [2, 14, 19, 20, 21, 24, 116, 117, 118, 119], "also": [2, 8, 11, 14, 15, 16, 18, 19, 21, 24, 36, 57, 58, 69, 70, 72, 88, 89, 90, 91, 97, 98, 99, 100, 101, 107, 108, 109, 116, 117, 118, 119], "indic": [2, 14, 18, 23, 89, 92, 93, 98, 101, 102, 111, 112, 113, 114, 116, 118, 119], "physic": [2, 87, 97, 103, 104, 119], "go": [2, 48, 75, 79, 89, 111, 116, 118, 119], "out": [2, 4, 13, 24, 33, 38, 55, 58, 66, 71, 76, 117, 118, 119], "bound": [2, 7, 11, 16, 17, 21, 23, 90, 92, 93, 94, 95, 96, 118], "prematur": 2, "auxiliari": [2, 117], "diagnost": 2, "log": [2, 119], "might": [2, 9, 11, 12, 16, 17, 18, 19, 20, 23, 116, 117, 119], "instanc": [2, 4, 8, 9, 10, 12, 13, 14, 15, 16, 18, 20, 21, 109], "describ": [2, 10, 21, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 92, 93, 107, 111], "perform": [2, 3, 14, 18, 21, 22, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 106, 109, 119], "variabl": [2, 9, 11, 15, 18, 100, 107, 108, 109, 116, 117, 118, 119], "hidden": [2, 97, 119], "individu": [2, 3, 16, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 117, 119], "term": [2, 16, 91, 92, 97, 98, 99, 100, 101, 105, 106, 107, 108, 117], "combin": [2, 9, 14, 16, 21, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 55, 56, 57, 58, 59, 60, 61, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 106], "produc": [2, 16, 18, 102, 117], "total": [2, 44, 88, 89, 90, 98, 99, 100, 101, 102, 103, 105, 106, 107, 108, 114, 119], "In": [2, 3, 11, 14, 15, 16, 17, 19, 21, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 89, 91, 92, 98, 99, 100, 101, 107, 108, 114, 116, 117, 118, 119], "openai": [2, 8, 15, 16, 21, 23, 87, 115, 116, 118, 119], "gym": [2, 7, 8, 9, 10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 23, 87, 88, 89, 90, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 112, 113, 114, 115, 116, 117, 118, 119], "v26": [2, 119], "distinguish": [2, 117, 118], "howev": [2, 3, 8, 9, 10, 11, 12, 15, 16, 17, 18, 19, 21, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 92, 98, 99, 100, 101, 105, 106, 116, 117, 118], "deprec": 2, "favour": [2, 22, 23], "boolean": [2, 9, 14, 18, 23, 90, 116, 119], "valu": [2, 8, 9, 10, 11, 12, 13, 14, 16, 17, 18, 19, 21, 23, 24, 74, 88, 90, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 112, 113, 114, 116, 118, 119], "case": [2, 4, 9, 10, 11, 16, 17, 19, 21, 23, 57, 69, 89, 98, 99, 100, 101, 107, 108, 114, 117, 118, 119], "further": [2, 23, 74, 90, 105, 106, 119], "undefin": 2, "signal": [2, 16, 18, 21, 98, 100, 101, 108, 114, 117, 118], "mai": [2, 11, 12, 14, 15, 17, 18, 19, 21, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 98, 99, 100, 101, 107, 108, 113, 117], "emit": [2, 16, 18], "differ": [2, 9, 10, 14, 15, 16, 17, 18, 19, 21, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 89, 96, 98, 99, 100, 101, 102, 103, 104, 108, 109, 117, 118], "reason": [2, 23, 90], "mayb": 2, "underli": [2, 16, 18, 21, 92], "solv": [2, 88, 91, 93, 97, 103, 104, 117, 119], "successfulli": [2, 114], "certain": [2, 47, 49, 103, 104, 106, 116], "exceed": [2, 16, 18, 21, 98, 100, 101, 108, 116], "simul": [2, 24, 50, 51, 52, 53, 54, 97, 101, 102, 103, 104, 116, 119], "enter": [2, 14, 31, 33, 60, 90, 112], "invalid": [2, 11, 116], "int": [2, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 24, 111, 112, 113, 114, 116, 117, 119], "none": [2, 4, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 18, 19, 23, 113, 116, 117], "option": [2, 4, 7, 8, 9, 10, 11, 14, 15, 16, 18, 19, 21, 23, 89, 92, 93, 94, 95, 96, 117], "intern": [2, 4, 15, 19], "new": [2, 3, 9, 16, 17, 18, 19, 21, 22, 23, 28, 31, 33, 46, 92, 93, 94, 95, 96, 106, 109, 114, 116, 117, 118], "often": [2, 9, 97, 117], "some": [2, 9, 10, 11, 15, 16, 18, 19, 20, 21, 23, 24, 40, 48, 66, 89, 91, 92, 97, 106, 107, 114, 116, 117], "explor": [2, 9, 54, 109, 116], "generalis": 2, "polici": [2, 19, 20, 21, 23, 91, 97, 98, 99, 100, 101, 102, 107, 108, 109, 115, 118], "control": [2, 9, 11, 20, 21, 23, 24, 26, 29, 31, 32, 33, 34, 35, 40, 42, 45, 52, 53, 54, 57, 59, 66, 67, 69, 71, 72, 73, 74, 75, 76, 79, 80, 87, 89, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108], "alreadi": [2, 3, 16, 19, 21], "rng": [2, 4, 9, 10, 11, 117], "therefor": [2, 3, 9, 15, 23], "right": [2, 11, 24, 26, 28, 29, 30, 31, 35, 39, 40, 44, 46, 47, 48, 49, 50, 51, 52, 53, 54, 56, 57, 58, 59, 61, 63, 64, 65, 67, 70, 75, 77, 78, 80, 81, 84, 85, 88, 89, 90, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 107, 108, 112, 113, 114, 116, 117, 119], "after": [2, 4, 8, 14, 15, 18, 19, 21, 32, 36, 41, 47, 51, 55, 77, 90, 98, 99, 100, 101, 102, 107, 108, 111, 114, 116, 117, 118, 119], "never": 2, "again": [2, 90, 117], "custom": [2, 7, 9, 14, 15, 19, 21, 23, 24, 50, 51, 52, 53, 54, 107, 109, 113], "line": [2, 23, 47, 92, 114, 117], "correctli": [2, 19, 20, 117], "v0": [2, 3, 8, 15, 16, 18, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 89, 90, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 112, 113, 114, 117, 118, 119], "25": [2, 12, 24, 50, 51, 52, 53, 54, 98, 100, 101, 102, 108, 114], "return_info": 2, "now": [2, 23, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 116, 117, 118, 119], "expect": [2, 9, 10, 11, 15, 18, 21, 119], "prng": [2, 9, 10, 11], "doe": [2, 8, 10, 12, 14, 15, 16, 18, 22, 36, 52, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 117, 118], "pass": [2, 4, 7, 8, 9, 10, 11, 12, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 89, 90, 98, 99, 100, 101, 107, 108, 117], "chosen": [2, 11, 24], "sourc": [2, 97, 109, 116, 117, 118, 119], "entropi": 2, "timestamp": 2, "dev": [2, 119], "urandom": 2, "integ": [2, 10, 11, 12, 14, 18, 19, 23, 24, 117], "even": [2, 8, 25, 27, 33, 34, 36, 38, 41, 42, 45, 55, 56, 57, 59, 60, 62, 66, 69, 71, 72, 73, 74, 76, 79, 83, 86, 102, 116, 117], "exist": [2, 8, 9, 15, 16, 21], "usual": [2, 10, 11, 16, 18, 24, 50, 51, 52, 53, 54, 56, 100, 116, 117], "been": [2, 14, 18, 21, 23, 98, 101, 102, 109, 117, 118], "refer": [2, 14, 18, 21, 23, 117, 118], "minim": [2, 117, 118, 119], "abov": [2, 10, 11, 14, 22, 23, 24, 50, 51, 52, 53, 54, 92, 93, 96, 97, 119], "paradigm": 2, "specifi": [2, 9, 10, 11, 14, 16, 17, 18, 19, 20, 21, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 90, 91, 96, 100, 101, 105, 106, 108, 110, 113, 114, 117], "how": [2, 9, 14, 15, 21, 56, 58, 59, 102, 103, 105, 106, 116, 117, 118, 119], "depend": [2, 3, 10, 14, 19, 20, 24, 26, 27, 28, 29, 30, 31, 32, 35, 36, 37, 39, 40, 42, 44, 46, 47, 48, 49, 50, 51, 52, 53, 54, 58, 59, 61, 63, 64, 65, 67, 68, 70, 75, 77, 78, 80, 81, 82, 84, 85, 87, 91, 93, 97, 98, 99, 100, 101, 107, 108, 109, 113], "specif": [2, 8, 11, 18, 118, 119], "analog": [2, 24], "dictionari": [2, 9, 10, 14, 15, 16, 18, 19, 21, 116, 117, 119], "complement": 2, "It": [2, 8, 10, 11, 14, 15, 16, 18, 21, 24, 25, 26, 27, 28, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 55, 56, 57, 58, 59, 60, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 82, 83, 84, 85, 88, 97, 98, 99, 100, 101, 102, 105, 106, 107, 108, 109, 116, 117, 119], "renderfram": [2, 14], "list": [2, 8, 9, 10, 11, 14, 15, 16, 19, 21, 24, 116], "comput": [2, 14, 67, 79, 98, 103, 105, 106, 109, 116, 117], "frame": [2, 14, 18, 19, 24, 37, 89, 90, 102, 105], "render_mod": [2, 14, 15, 16, 18, 19, 21, 23, 24, 115, 117], "wai": [2, 10, 16, 21, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 116, 118], "most": [2, 9, 16, 18, 19, 21, 23, 24, 50, 51, 52, 53, 54, 106, 116, 117], "achiev": [2, 24, 27, 92, 111], "appli": [2, 7, 8, 10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 88, 90, 91, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 116, 117, 119], "collect": [2, 3, 15, 27, 30, 48, 62, 63, 66, 82, 109, 116], "As": [2, 3, 15, 16, 21, 80, 92, 97, 98, 99, 101, 102, 110, 112, 114, 119], "known": [2, 18, 31], "__init__": [2, 10, 13, 16, 17, 19, 20, 116, 117, 119], "initialis": [2, 18, 23, 111], "By": [2, 8, 18, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 92, 98, 99, 100, 101, 107, 108], "continu": [2, 9, 16, 17, 21, 29, 30, 89, 90, 91, 94, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 116, 118, 119], "current": [2, 3, 11, 14, 16, 18, 19, 24, 89, 92, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 112, 113, 116, 117, 119], "displai": [2, 8, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 93, 117], "consumpt": 2, "occur": [2, 18, 92, 93, 117], "repres": [2, 10, 11, 14, 21, 23, 90, 92, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 112, 113, 114, 115, 117, 119], "np": [2, 7, 9, 10, 11, 13, 14, 15, 17, 18, 19, 20, 90, 114, 116, 117, 119], "ndarrai": [2, 4, 7, 8, 10, 11, 12, 13, 14, 17, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 114, 119], "shape": [2, 9, 10, 11, 12, 13, 16, 17, 18, 19, 21, 88, 89, 90, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 112, 113, 114, 117, 119], "x": [2, 9, 12, 90, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 105, 106, 107, 108, 109, 112, 117, 119], "y": [2, 24, 90, 96, 98, 99, 101, 102, 103, 105, 106, 107, 114, 119], "3": [2, 7, 8, 10, 11, 12, 13, 14, 15, 18, 19, 22, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 89, 90, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 112, 113, 114, 116, 117, 119], "rgb": [2, 16, 18, 19, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 89, 98, 99, 100, 101, 102, 103, 104, 107, 108], "pixel": [2, 16, 89, 109, 117], "imag": [2, 9, 15, 16, 18, 19, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 89], "string": [2, 8, 9, 11, 14, 19], "stringio": 2, "style": [2, 15, 18, 109, 119], "represent": [2, 21, 118], "each": [2, 3, 8, 9, 10, 11, 14, 15, 16, 17, 19, 21, 24, 44, 46, 47, 48, 49, 52, 60, 67, 69, 70, 71, 72, 73, 74, 75, 87, 88, 90, 91, 92, 93, 94, 95, 98, 101, 102, 103, 104, 105, 109, 110, 112, 114, 116, 117], "includ": [2, 8, 19, 21, 22, 23, 24, 93, 98, 99, 100, 101, 103, 104, 105, 106, 107, 108, 109, 114, 117, 118], "newlin": 2, "escap": [2, 43, 58, 62], "sequenc": [2, 8, 9, 11, 12, 15, 19, 21, 24, 109], "color": [2, 10, 28, 39, 52, 70, 114], "rgb_array_list": [2, 14, 16, 18], "ansi_list": 2, "base": [2, 3, 4, 9, 10, 15, 16, 17, 18, 19, 20, 21, 48, 57, 74, 87, 92, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 114, 116, 117, 119], "except": [2, 71, 74, 117], "rendercollect": [2, 3, 16, 18], "pop": [2, 106], "kei": [2, 8, 9, 10, 11, 14, 15, 16, 18, 19, 21, 24, 25, 56, 98, 99, 100, 101, 105, 106, 107, 108, 112, 113, 114, 116, 117, 118], "support": [2, 3, 9, 10, 12, 14, 15, 16, 18, 19, 21, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 92, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 117], "longer": [2, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 98, 100, 101, 102, 103, 104, 105, 106, 108, 109, 119], "accept": [2, 14, 18, 24, 117], "rather": [2, 23, 89, 109, 116], "v1": [2, 7, 8, 14, 15, 18, 19, 20, 21, 88, 89, 90, 92, 93, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 113, 114, 116], "type": [2, 9, 10, 11, 15, 16, 17, 19, 21, 23, 46, 89, 98, 99, 100, 101, 107, 108, 109, 117, 119], "discret": [2, 9, 10, 12, 13, 15, 17, 19, 21, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 89, 90, 92, 93, 94, 95, 110, 111, 112, 113, 114, 116, 117], "give": [2, 27, 28, 46, 47, 90, 105, 111, 114, 116, 119], "2": [2, 7, 10, 11, 12, 13, 14, 15, 17, 19, 20, 24, 25, 26, 28, 29, 30, 31, 32, 34, 35, 37, 39, 40, 42, 44, 46, 47, 48, 49, 50, 51, 52, 53, 54, 56, 58, 61, 63, 64, 65, 67, 68, 70, 75, 77, 78, 79, 80, 81, 82, 84, 85, 89, 90, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 111, 112, 113, 114, 116, 117, 119], "mean": [2, 21, 23, 92, 98, 99, 100, 105, 117, 119], "two": [2, 10, 11, 14, 15, 18, 23, 24, 26, 37, 79, 88, 90, 92, 94, 95, 97, 98, 99, 100, 101, 102, 103, 105, 106, 107, 108, 111, 116, 117], "1": [2, 7, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 89, 90, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 112, 113, 114, 116, 117, 118, 119], "box": [2, 9, 10, 12, 13, 15, 16, 17, 19, 21, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 89, 90, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 117], "4028234663852886e": 2, "38": [2, 101, 102], "4": [2, 11, 12, 14, 15, 16, 17, 18, 19, 21, 24, 26, 28, 29, 30, 31, 33, 35, 37, 39, 40, 44, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 58, 61, 63, 64, 65, 67, 68, 69, 70, 77, 78, 80, 81, 82, 84, 85, 88, 89, 90, 92, 93, 94, 95, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 112, 113, 114, 116, 117, 119], "float32": [2, 10, 11, 12, 13, 15, 16, 17, 19, 21, 88, 89, 90, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108], "denot": [2, 93], "well": [2, 9, 31, 74, 92, 98, 101, 102, 109, 117], "high": [2, 3, 10, 11, 12, 13, 15, 19, 21, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 89, 90, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109], "8000002e": 2, "00": 2, "4028235e": 2, "1887903e": 2, "01": [2, 20, 90, 98, 99, 102, 103, 104, 105, 106, 107, 116], "dtype": [2, 9, 10, 11, 12, 13, 15, 19, 90, 117], "low": [2, 10, 11, 12, 13, 19, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 89, 90, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109], "etc": [2, 9, 16, 69, 72, 76, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 117, 118], "determin": [2, 11, 24, 90, 92, 93, 94, 95, 96, 109, 113, 117, 118], "inf": [2, 19, 93, 95, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108], "envspec": [2, 8, 16], "normal": [2, 11, 16, 18, 88, 89, 96, 98, 99, 103, 119], "finish": [2, 89, 90], "code": [2, 4, 9, 10, 14, 15, 16, 18, 19, 20, 92, 109, 116, 117, 119], "clean": 2, "up": [2, 10, 11, 15, 19, 24, 25, 27, 28, 29, 30, 31, 33, 34, 35, 37, 40, 43, 44, 46, 47, 48, 49, 50, 51, 52, 53, 54, 57, 58, 61, 63, 68, 70, 71, 72, 74, 75, 78, 79, 80, 81, 84, 85, 88, 90, 97, 98, 101, 102, 106, 111, 112, 113, 114, 116, 117], "window": [2, 14, 44, 89, 117], "http": [2, 14, 16, 24, 89, 92, 111, 112, 113, 116, 117, 119], "connect": [2, 10, 92, 98, 99, 100, 106, 107, 108], "properti": [2, 9, 16, 118], "unwrap": [2, 16, 21, 92], "non": [2, 9, 12, 14, 113, 117, 118, 119], "wrap": [2, 7, 8, 14, 15, 16, 18, 19, 20, 21, 117, 119], "_np_random": 2, "meth": 2, "much": [2, 24, 50, 51, 52, 53, 54, 58, 59, 102, 117, 118], "creat": [2, 8, 11, 13, 14, 15, 18, 21, 34, 88, 89, 90, 105, 106, 116, 119], "creation": [2, 15, 117], "tutori": [2, 21, 23, 116, 119], "gymnasium": [3, 7, 8, 9, 10, 11, 12, 13, 14, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 111, 112, 113, 114, 116, 118, 119], "env": [3, 4, 7, 8, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 89, 90, 92, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 112, 113, 114, 115, 116, 118, 119], "flexibl": [3, 15, 109], "implement": [3, 9, 10, 15, 17, 18, 19, 20, 21, 22, 23, 24, 96, 103, 109, 110, 114, 117, 119], "complic": [3, 11, 16], "parallel": [3, 15], "propos": [3, 109], "funcenv": 3, "part": [3, 18, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 89, 90, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 112, 113, 114, 118], "its": [3, 14, 15, 17, 18, 39, 46, 69, 81, 86, 90, 96, 97, 107, 109, 119], "own": [3, 15, 23, 39, 74], "relat": [3, 119], "larg": [3, 15, 16, 23, 95, 98, 99, 100, 101, 102, 105, 106, 107, 108, 109], "believ": 3, "improv": [3, 15], "arbitrarili": 3, "complex": [3, 9, 10, 101, 102, 103, 104, 119], "rl": [3, 14, 18, 115, 116, 118, 119], "advanc": [3, 15, 92], "becom": [3, 73, 87, 118], "were": [3, 19, 23, 41, 87, 92, 117], "mind": 3, "jax": [3, 109], "pytorch": [3, 119], "data": [3, 9, 12, 14, 16, 23, 116, 117, 119], "With": [3, 112, 116], "hardwar": 3, "acceler": [3, 89, 94, 95, 96], "brax": [3, 109], "written": [3, 14, 16, 23], "similar": [3, 10, 23, 28, 39, 105, 117], "program": [3, 15], "game": [3, 11, 14, 18, 21, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 63, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 87, 111, 112, 113, 116, 117], "town": 3, "anymor": 3, "upgrad": 3, "jumpi": 3, "torch": [3, 119], "project": [3, 21, 23, 109, 116], "like": [3, 4, 9, 11, 14, 16, 17, 18, 19, 20, 21, 26, 27, 28, 29, 30, 31, 32, 33, 35, 37, 39, 40, 44, 46, 47, 48, 49, 58, 61, 63, 64, 65, 66, 67, 68, 69, 70, 75, 77, 78, 80, 81, 82, 84, 85, 88, 90, 98, 99, 101, 102, 104, 105, 106, 108, 114, 117], "supersuit": 3, "aim": [3, 56, 100, 103, 107, 108, 119], "bring": 3, "detail": [3, 9, 14, 18, 21, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 92, 109, 117], "caus": [3, 18, 21, 57, 114], "ad": [3, 16, 18, 19, 21, 23, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 52, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 90, 95, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 114, 117], "v28": 3, "rewrit": 3, "vectorenv": [3, 9], "inherit": [3, 9, 16, 17, 19, 20, 21, 117], "vectoris": [3, 9, 109], "old": [3, 15, 16, 18, 22, 115], "tree": [3, 75], "structur": [3, 4, 9, 10, 12, 117], "transformobserv": [3, 16, 19], "lambdaobservationv0": [3, 7], "vectorlambdaobserv": 3, "No": [3, 18, 92, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 119], "filterobserv": [3, 16, 19], "vectorfilterobserv": 3, "ye": 3, "flattenobserv": [3, 10, 16, 19, 117], "vectorflattenobserv": 3, "grayscaleobserv": [3, 16, 19], "vectorgrayscaleobserv": 3, "pixelobservationwrapp": [3, 16, 19], "pixelobserv": 3, "vectorpixelobserv": 3, "resizeobserv": [3, 16, 19], "vectorresizeobserv": 3, "Not": [3, 18], "reshapeobserv": 3, "vectorreshapeobserv": 3, "rescaleobserv": 3, "vectorrescaleobserv": 3, "dtypeobserv": 3, "vectordtypeobserv": 3, "normalizeobserv": [3, 16, 19], "vectornormalizeobserv": 3, "timeawareobserv": [3, 16, 19, 21], "vectortimeawareobserv": 3, "framestack": [3, 16, 18], "framestackobserv": 3, "vectorframestackobserv": 3, "delayobserv": 3, "vectordelayobserv": 3, "ataripreprocess": [3, 16, 18], "lambdaactionv0": [3, 7], "vectorlambdaact": 3, "clipact": [3, 16, 17, 21], "vectorclipact": 3, "rescaleact": [3, 16, 17, 21], "vectorrescaleact": 3, "nanact": 3, "vectornanact": 3, "stickyact": 3, "vectorstickyact": 3, "transformreward": [3, 16, 20], "lambdarewardv0": [3, 7], "vectorlambdareward": 3, "cliprewardv0": [3, 7], "vectorclipreward": 3, "rescalereward": 3, "vectorrescalereward": 3, "normalizereward": [3, 16, 20], "vectornormalizereward": 3, "autoresetwrapp": [3, 8, 16, 18, 117], "autoreset": [3, 8, 15, 117], "vectorautoreset": 3, "passiveenvcheck": [3, 18, 21], "vectorpassiveenvcheck": 3, "orderenforc": [3, 16, 18, 21, 117], "vectororderenforc": 3, "envcompat": [3, 16, 18, 22, 23], "shimmi": 3, "recordepisodestatist": [3, 16, 18, 23, 116, 119], "vectorrecordepisodestatist": 3, "vectorrendercollect": 3, "humanrend": [3, 16, 18], "jaxtonumpi": 3, "vectorjaxtonumpi": 3, "jaxtotorch": 3, "vectorjaxtotorch": 3, "vectorlistinfo": [3, 15, 16, 18], "These": [3, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 97, 98, 101, 107, 116, 119], "28": [3, 24, 33, 39, 92, 101, 102], "templat": 4, "meant": 4, "stateless": 4, "manner": [4, 11, 16, 19, 56], "being": [4, 8, 12, 18, 45, 94, 95, 96, 98, 101, 102, 106, 116], "around": [4, 18, 34, 87, 106, 109], "explicitli": [4, 117, 118], "That": [4, 93], "said": [4, 98, 100, 101, 108], "noth": [4, 89, 90, 119], "here": [4, 14, 92, 117], "prevent": [4, 11, 15, 47, 109], "statefulli": 4, "just": [4, 16, 21, 50, 56, 73, 104, 106], "recommend": [4, 8, 15, 18, 23, 24, 50, 51, 52, 53, 54, 90, 98, 101, 102, 116, 117], "consist": [4, 11, 16, 19, 21, 24, 37, 88, 92, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 111, 116, 117, 119], "method": [4, 10, 14, 17, 18, 19, 20, 22, 117, 119], "pomdp": 4, "given": [4, 8, 11, 16, 19, 71, 74, 88, 90, 91, 92, 94, 95, 98, 100, 101, 108, 116, 118], "transit": [4, 14, 21, 24, 50, 51, 52, 53, 54, 101, 102, 112, 113, 114, 118], "next_stat": [4, 116], "state_info": 4, "step_info": 4, "serv": [4, 9, 98, 99, 100, 101, 107, 108, 119], "purpos": [4, 9, 119], "allow": [4, 7, 8, 9, 10, 14, 16, 21, 22, 23, 24, 55, 73, 92, 93, 94, 95, 96, 103, 104, 105, 106, 109, 117, 119], "constant": [4, 35, 74, 90, 95, 98, 100, 101, 108], "them": [4, 9, 16, 18, 22, 23, 24, 26, 27, 28, 31, 32, 36, 40, 47, 68, 77, 90, 99, 106, 114], "itself": [4, 12, 15, 16, 18, 21, 22], "moment": [4, 74], "predominantli": 4, "futur": [4, 80, 109], "intend": [4, 18, 113], "flesh": 4, "offici": 4, "expos": 4, "statetyp": 4, "rewardtyp": 4, "terminaltyp": 4, "full": [4, 21, 24, 50, 51, 52, 53, 54, 89, 90, 116], "transform": [4, 9, 12, 14, 16, 17, 18, 106], "func": [4, 7, 12], "callabl": [4, 7, 8, 13, 14, 15, 18, 19, 20], "render_imag": 4, "render_st": 4, "renderstatetyp": 4, "show": [4, 19, 23, 24, 34, 40, 111, 116, 119], "render_init": 4, "kwarg": [4, 8, 14, 15, 22, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 117], "render_clos": 4, "autoclass": 4, "gymasnium": 4, "experiment": [7, 92], "argtyp": 7, "constructor": [7, 8, 9, 10, 11, 14, 16, 17, 19, 20, 21, 117], "environ": [7, 9, 11, 13, 16, 17, 19, 20, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 110, 111, 112, 113, 114, 118, 119], "lambdaact": 7, "_": [7, 13, 14, 15, 16, 21, 115], "rew": [7, 14, 118], "min_reward": [7, 20], "union": [7, 8, 10, 11, 12, 13, 14, 15, 17, 19], "float": [7, 8, 11, 12, 14, 16, 17, 19, 20, 24, 55, 68, 90, 98, 99, 100, 101, 107, 108, 116, 117, 119], "max_reward": [7, 20], "clip": [7, 16, 20, 21, 94, 95, 98, 101, 117], "between": [7, 10, 11, 18, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 90, 92, 93, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 116, 117, 118, 119], "upper": [7, 11, 21, 101, 102], "lower": [7, 11, 21, 98, 99, 100, 101, 102, 105, 106, 107, 108, 116], "5": [7, 10, 11, 12, 13, 17, 18, 24, 26, 28, 29, 30, 31, 34, 35, 37, 40, 44, 46, 47, 48, 49, 50, 51, 52, 53, 54, 58, 61, 63, 64, 65, 67, 68, 70, 77, 78, 80, 81, 82, 84, 85, 88, 89, 90, 92, 94, 98, 99, 100, 101, 102, 103, 105, 106, 107, 108, 111, 114, 116, 117, 119], "cliprewardsv0": 7, "higher": [7, 88], "load": 8, "pre": [8, 113], "sever": [8, 11, 16, 18, 21, 23, 24, 54, 109], "id": [8, 15, 113, 117], "liter": 8, "mountaincar": [8, 94], "mountaincarcontinu": [8, 95], "pendulum": [8, 15, 19, 21, 91, 92, 93, 97, 119], "acrobot": [8, 91], "lunarland": [8, 18, 21, 23, 90, 115], "v2": [8, 17, 18, 21, 23, 88, 89, 90, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 114, 115], "lunarlandercontinu": [8, 17], "bipedalwalk": [8, 16, 17, 21, 88], "v3": [8, 16, 17, 21, 88, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 114], "bipedalwalkerhardcor": 8, "carrac": [8, 14, 19, 89], "blackjack": [8, 21, 110], "frozenlak": [8, 14, 113], "frozenlake8x8": 8, "cliffwalk": [8, 112], "taxi": [8, 110], "reacher": [8, 16, 97, 105], "v4": [8, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 119], "pusher": 8, "invertedpendulum": [8, 97, 103, 104, 119], "inverteddoublependulum": [8, 103], "halfcheetah": [8, 97, 99], "hopper": [8, 97, 108], "swimmer": [8, 97], "walker2d": [8, 97], "ant": [8, 97, 100, 108], "humanoidstandup": [8, 97, 102], "humanoid": [8, 45, 97, 98], "accord": [8, 10, 11, 15, 90], "find": [8, 24, 25, 50, 51, 52, 53, 54, 60, 69, 81, 103, 106, 117], "avail": [8, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 90, 109, 111, 112, 117], "modul": [8, 13, 117, 119], "eg": [8, 14, 117], "max_episode_step": [8, 18, 117], "length": [8, 10, 11, 14, 16, 18, 19, 88, 92, 93, 94, 95, 99, 107, 109, 113, 114, 116], "apply_api_compat": [8, 18, 22], "stepapicompat": [8, 16, 18, 22], "argument": [8, 9, 10, 11, 12, 14, 15, 19, 21, 22, 87, 91, 110, 116, 117], "fals": [8, 14, 15, 18, 19, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 89, 90, 98, 99, 100, 101, 107, 108, 111, 116, 117, 119], "disable_env_check": [8, 15], "checker": [8, 15], "addit": [8, 9, 15, 16, 18, 21, 23, 24, 30, 41, 71, 75, 90, 91, 92, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 111, 114, 116, 117, 119], "rais": [8, 11, 12, 13, 14, 15, 18, 19, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108], "error": [8, 11, 12, 14, 16, 18, 116, 118], "entry_point": [8, 117], "reward_threshold": [8, 98, 99, 100, 101, 102, 105, 106, 107, 108, 117], "nondeterminist": [8, 117], "order_enforc": [8, 117], "syntax": 8, "namespac": [8, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 117], "env_nam": [8, 22], "v": [8, 73, 94, 103], "keyword": [8, 10, 15, 19, 21, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 111, 116, 117], "entri": 8, "point": [8, 12, 14, 16, 24, 27, 28, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 45, 46, 47, 48, 49, 51, 55, 56, 59, 66, 67, 68, 69, 70, 71, 72, 74, 76, 77, 78, 80, 81, 84, 88, 89, 90, 92, 93, 96, 106, 111, 118], "threshold": [8, 92, 93, 114, 117], "consid": [8, 19, 89, 90, 91, 97, 98, 100, 101, 108, 117], "learnt": 8, "knowledg": 8, "limit": [8, 21, 40, 48, 55, 56, 69, 74, 103, 104, 116, 119], "enabl": [8, 16, 24, 89, 109], "order": [8, 9, 10, 16, 21, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 97, 98, 99, 100, 101, 102, 103, 104, 105, 108, 109, 117], "enforc": 8, "correct": [8, 114, 117, 118], "disabl": [8, 18, 113], "pprint_registri": 8, "onli": [8, 9, 10, 11, 12, 15, 16, 17, 18, 19, 23, 24, 26, 28, 29, 30, 31, 32, 35, 37, 39, 40, 44, 46, 47, 48, 49, 50, 51, 52, 53, 54, 56, 58, 61, 63, 64, 65, 67, 68, 70, 71, 72, 73, 74, 75, 77, 78, 80, 81, 82, 84, 85, 94, 95, 98, 99, 100, 101, 103, 105, 106, 108, 109, 116, 117], "env_id": [8, 22], "retriev": [8, 18, 45, 48, 74], "global": 8, "_registri": 8, "num_col": 8, "exclude_namespac": 8, "disable_print": 8, "column": [8, 119], "arrang": 8, "exclud": [8, 98, 99, 100, 101, 107, 108], "instead": [8, 15, 19, 21, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 92, 108, 117], "consol": [8, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86], "npt": [9, 10, 11], "dtypelik": 9, "superclass": [9, 17, 19, 20], "crucial": 9, "thei": [9, 15, 18, 19, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 106, 110, 111, 112, 113, 117], "variou": [9, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 102, 109, 119], "clearli": 9, "interact": [9, 14, 24, 109, 116, 117], "look": [9, 14, 16, 18, 20, 21, 24, 26, 28, 29, 30, 31, 32, 35, 37, 39, 40, 44, 46, 47, 48, 49, 58, 61, 63, 64, 65, 67, 68, 70, 73, 75, 77, 78, 80, 81, 82, 84, 85, 117, 118], "u": [9, 16, 20, 24, 116, 117, 119], "work": [9, 14, 16, 18, 19, 24, 89, 90, 92, 99, 100, 103, 104, 108], "highli": [9, 23, 24, 87, 91, 109, 117], "form": [9, 10, 11, 18, 92, 107, 117], "painlessli": 9, "flat": [9, 10, 11, 12, 19], "sampl": [9, 10, 11, 12, 13, 14, 15, 19, 20, 21, 23, 90, 114, 115, 116, 117, 119], "especi": [9, 20, 117], "hierarch": [9, 114], "via": [9, 10, 16, 18, 19, 20, 21, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 91, 97, 109, 110, 117, 119], "build": [9, 16, 26, 44, 48, 103, 108], "express": [9, 14, 98, 101, 102], "cover": [9, 116], "parametr": [9, 119], "probabl": [9, 24, 112, 113, 114, 116, 118, 119], "distribut": [9, 10, 11, 107, 109, 113, 119], "batch": [9, 13, 15], "moreov": [9, 18, 24, 27, 37, 117], "handl": [9, 15, 103, 111, 116], "care": [9, 75], "immut": 9, "mask": [9, 10, 11, 23, 114], "t_cov": 9, "randomli": [9, 10, 90, 113, 117], "uniform": [9, 11, 12, 94, 95, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108], "bounded": 9, "int8": [9, 11], "member": [9, 58], "possibli": [9, 10, 11, 13, 16, 18, 21, 109], "subspac": [9, 10, 11, 12], "to_json": 9, "sample_n": 9, "jsonabl": 9, "from_json": 9, "matric": [9, 109], "multidiscret": [9, 10, 12, 13, 15, 21, 117], "binari": [9, 11, 21, 117], "hold": [9, 111, 116], "down": [9, 11, 24, 28, 30, 31, 37, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 57, 58, 61, 63, 65, 66, 68, 70, 78, 80, 81, 84, 85, 89, 102, 111, 112, 113, 114, 116, 117, 118], "button": [9, 11, 14, 21], "multibinari": [9, 10, 12, 13, 21], "multipl": [9, 10, 11, 13, 15], "ax": [9, 11, 116, 117], "messag": 9, "mission": [9, 57, 59, 60], "join": 9, "togeth": [9, 24, 97], "separ": [9, 10, 23, 117], "readabl": [9, 10], "fix": [9, 10, 11, 16, 18, 20, 21, 23, 57, 92, 93, 96, 97, 98, 99, 100, 101, 103, 104, 108, 111, 113, 117, 119], "unord": 9, "entiti": 9, "select": [9, 11, 47, 98, 101, 102, 105, 106], "graph": [9, 12, 21], "node": [9, 10, 12], "edg": [9, 10, 12, 93], "flatten": [9, 12, 16, 97, 116, 117], "unflatten": [9, 12], "neural": [9, 12, 92, 107, 109, 119], "network": [9, 12, 107], "flatdim": [9, 12], "dimens": [9, 11, 12, 19, 98, 99, 100, 101, 107, 108, 109, 119], "flatten_spac": [9, 12], "revers": [9, 12, 111, 119], "size": [9, 18, 113, 117], "batch_spac": [9, 13], "concaten": [9, 12, 13, 97], "iter": [9, 10, 13, 15], "create_empty_arrai": [9, 13], "create_shared_memori": [9, 13], "read_from_shared_memori": [9, 13], "write_to_shared_memori": [9, 13], "spaces_kwarg": 10, "constitu": 10, "usag": [10, 11, 12, 16, 89], "ordereddict": [10, 13, 19], "nest": [10, 13, 109], "ext_control": 10, "inner_st": 10, "charg": 10, "100": [10, 12, 18, 38, 48, 71, 72, 88, 89, 90, 92, 95, 100, 105, 112, 113], "system_check": 10, "10": [10, 11, 17, 24, 31, 37, 50, 51, 52, 53, 54, 61, 68, 71, 74, 88, 90, 96, 98, 99, 100, 101, 102, 103, 105, 106, 107, 108, 111, 112, 114, 116, 117, 119], "job_statu": 10, "progress": [10, 80], "conveni": [10, 16, 21, 117], "easili": [10, 16], "deal": 10, "instanti": [10, 14, 18, 19, 20, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 117], "either": [10, 11, 12, 14, 18, 21, 22, 24, 47, 57, 94, 95, 111, 113, 119], "avoid": [10, 13, 16, 21, 24, 27, 28, 30, 35, 36, 44, 46, 62, 63, 65, 70, 72, 73, 78, 112, 114], "independ": [10, 11, 15, 100, 106, 107, 108], "same": [10, 12, 14, 15, 19, 56, 88, 89, 92, 105, 106, 107, 114, 116, 118], "attr": 10, "warn": [10, 14, 15, 18], "guarante": [10, 24], "uniqu": [10, 87, 91, 97, 103], "sub": [10, 15, 74], "precis": 10, "cartesian": [10, 11, 96], "product": [10, 11], "03633198": 10, "42370757": 10, "involv": [10, 87, 103, 104, 109, 112, 113, 114, 117, 119], "reproduc": [10, 23], "draw": [10, 111, 116, 117], "42": [10, 11, 93, 101, 102, 115], "54": 10, "finit": [10, 11, 17, 98, 102, 103, 104, 105, 106, 108, 118, 119], "a_0": 10, "dot": [10, 11, 117], "a_n": 10, "a_i": 10, "belong": [10, 13], "n": [10, 11, 12, 13, 21, 24, 43, 89, 92, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 116, 119], "0259352": 10, "80977976": 10, "80066574": 10, "77165383": 10, "must": [10, 12, 13, 14, 15, 16, 17, 18, 19, 21, 23, 24, 25, 26, 29, 31, 32, 33, 34, 36, 40, 41, 42, 45, 48, 49, 58, 62, 64, 65, 70, 89, 100, 108, 117, 118], "length_mask": 10, "sample_mask": 10, "drawn": [10, 11, 105, 107, 111], "geometr": 10, "featur": [10, 11, 109], "feature_spac": 10, "node_spac": [10, 12], "edge_spac": [10, 12], "seri": [10, 21], "adjac": 10, "matrix": 10, "edge_link": [10, 12], "num_nod": 10, "num_edg": 10, "graphinst": [10, 12], "don": [10, 16, 23, 24, 40, 50, 51, 52, 53, 54, 74, 89, 94, 117, 118], "edge_mask": 10, "multipli": [10, 95], "attribut": [10, 21, 23, 105, 106, 117], "unbound": 11, "mathbb": 11, "interv": [11, 21, 98, 100, 101, 108], "There": [11, 16, 21, 56, 57, 69, 88, 90, 91, 94, 95, 97, 102, 103, 104, 105, 106, 109, 112, 114, 117], "common": [11, 16, 19, 21, 118, 119], "ident": [11, 15, 19], "construct": [11, 24, 50, 51, 52, 53, 54, 92, 98, 99, 100, 101, 107, 108], "scalar": [11, 17], "respect": [11, 15, 16, 18, 21, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 90, 92, 98, 101, 102, 107], "assum": [11, 19, 117], "across": [11, 13, 30, 40, 51, 52, 55], "infer": [11, 97], "essenti": 11, "valueerror": [11, 12, 13, 15, 18, 19], "coordin": [11, 16, 19, 88, 90, 96, 98, 99, 100, 101, 102, 103, 105, 106, 107, 108], "shift": [11, 21], "exponenti": [11, 16, 20], "unsupport": 11, "is_bound": 11, "both": [11, 15, 18, 19, 21, 22, 88, 91, 92, 106, 108, 109, 111, 112, 113, 114, 117, 118, 119], "sens": [11, 109], "One": [11, 21, 98, 101, 102], "neither": [11, 18, 111], "nor": [11, 18, 111, 112], "mani": [11, 18, 19, 21, 24, 30, 33, 37, 56, 59, 74, 84, 116, 117], "subset": [11, 17, 24, 50, 51, 52, 53, 54, 117], "smallest": 11, "maskndarrai": 11, "uniformli": [11, 24, 92, 93, 105, 106, 117], "infeas": 11, "sort": 11, "fair": 11, "coin": 11, "toss": 11, "per": [11, 15, 37, 56, 79, 114, 118], "nvec": 11, "int64": [11, 12], "keyboard": [11, 14], "alwai": [11, 12, 18, 24, 90, 94, 95, 98, 101, 102, 105, 107, 111, 112, 113, 114, 117], "noop": [11, 14, 18, 24, 26, 28, 29, 30, 31, 32, 35, 37, 39, 40, 44, 46, 47, 48, 49, 50, 51, 52, 53, 54, 58, 61, 63, 64, 65, 67, 68, 70, 75, 77, 78, 80, 81, 82, 84, 85, 114], "nintendo": 11, "conceptu": 11, "arrow": [11, 68], "left": [11, 24, 26, 28, 29, 30, 31, 35, 39, 40, 44, 46, 47, 48, 49, 50, 51, 52, 53, 54, 56, 57, 58, 61, 63, 64, 65, 67, 70, 74, 75, 77, 78, 80, 81, 84, 85, 88, 89, 90, 93, 94, 98, 101, 102, 103, 104, 108, 112, 113, 114, 116, 117, 119], "param": 11, "min": [11, 17, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111], "max": [11, 17, 18, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 113, 116, 119], "press": [11, 14, 21, 89, 92], "although": 11, "rare": 11, "d": [11, 14, 92, 105, 106], "categor": 11, "vector": [11, 14, 16, 88, 90, 102, 103, 104, 105, 106, 119], "count": [11, 88, 90, 111, 116], "kind": 11, "unless": [11, 16, 111, 112, 113, 114, 117], "max_length": 11, "min_length": 11, "charset": 11, "alphanumer": 11, "compris": 11, "charact": [11, 14, 58, 69], "b5": 11, "hello": 11, "0123456789": 11, "digit": [11, 109], "inclus": [11, 24], "empti": [11, 13, 18, 74, 116, 119], "english": 11, "alphabet": 11, "plu": [11, 40, 112], "latin": 11, "charlist": 11, "zero": [11, 13, 96, 99, 109, 116, 117, 118, 119], "matter": 11, "equival": [12, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86], "would": [12, 17, 19, 20, 98, 99, 100, 101, 102, 107, 108, 115, 117], "notimplementederror": 12, "cannot": [12, 13, 18, 21, 23, 112, 117, 118], "attempt": [12, 90, 102, 103, 114], "compound": 12, "oper": [12, 18], "boundari": 12, "while": [12, 23, 24, 27, 28, 44, 59, 62, 63, 64, 65, 68, 70, 72, 74, 78, 81, 83, 90, 92, 93, 96, 98, 99, 101, 102, 105, 106, 107, 111, 112, 116, 117, 118, 119], "exactli": [12, 107], "origin": [12, 15, 17, 18, 19, 23, 89, 92, 103, 105, 106], "effect": [12, 13, 16, 18, 19, 21, 24, 50, 51, 52, 53, 54, 90, 103, 104, 114, 116, 119], "necessarili": 12, "hot": 12, "encod": [12, 114, 117], "60": [12, 58, 71, 109], "recurs": 12, "6": [12, 24, 28, 29, 30, 31, 35, 44, 46, 47, 48, 49, 50, 51, 52, 53, 54, 58, 61, 63, 65, 79, 80, 81, 84, 85, 92, 94, 95, 98, 99, 100, 101, 102, 103, 105, 106, 107, 108, 112, 114, 119], "12": [12, 24, 31, 33, 37, 39, 50, 51, 52, 53, 54, 58, 61, 73, 90, 92, 93, 98, 99, 100, 101, 102, 105, 108, 111, 112, 116], "int32": 12, "15": [12, 13, 24, 47, 50, 51, 52, 53, 54, 58, 77, 90, 98, 99, 101, 102, 105, 108, 109, 113], "k": [12, 14, 18, 90, 107], "m": [12, 24, 43, 92, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 117], "match": [12, 15, 17, 79], "copi": [13, 15, 117], "item": [13, 14, 109, 116], "6348213": 13, "28607962": 13, "60760117": 13, "87383074": 13, "192658": 13, "2148103": 13, "99644893": 13, "08304597": 13, "7238421": 13, "35848552": 13, "1533453": 13, "67958736": 13, "49076623": 13, "38661423": 13, "7975036": 13, "93317133": 13, "stopiter": 13, "fn": 13, "multi_binari": 13, "built": [13, 23, 109], "multi_discret": 13, "ctx": 13, "mp": 13, "multiprocess": [13, 15], "opt": 13, "hostedtoolcach": 13, "9": [13, 15, 24, 28, 31, 36, 45, 50, 51, 52, 53, 54, 58, 61, 71, 80, 85, 92, 96, 98, 99, 100, 101, 102, 103, 105, 106, 108, 111, 116], "x64": 13, "lib": [13, 112], "python3": 13, "process": [13, 14, 15, 19, 21, 92, 105, 117, 118], "eventu": 13, "shared_memori": [13, 15], "customspaceerror": 13, "read": [13, 23, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 89, 90, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 112, 113, 114], "forward": [13, 35, 57, 88, 98, 99, 100, 101, 102, 107, 108, 119], "vice": [13, 18], "versa": [13, 18], "side": [13, 19, 26, 39, 54, 56, 90], "write": [13, 15, 117], "num_env": [13, 15], "plai": [14, 21, 34, 47, 60, 79, 84, 89, 109, 116, 117], "transpos": [14, 117], "zoom": 14, "callback": 14, "keys_to_act": 14, "w": [14, 98, 101, 102], "7": [14, 24, 28, 30, 31, 35, 44, 46, 47, 48, 49, 50, 51, 52, 53, 54, 58, 61, 63, 65, 80, 81, 84, 85, 98, 99, 100, 101, 102, 103, 105, 106, 107, 108], "dw": 14, "particularli": [14, 18, 93], "verifi": 14, "level": [14, 21, 24, 31, 48, 70, 78, 109], "preprocess": [14, 16], "unplay": 14, "wish": [14, 19, 23], "real": [14, 56, 99], "statist": [14, 119], "playplot": 14, "last": [14, 18, 46, 47, 57, 99, 102, 105, 106, 117, 118], "150": 14, "def": [14, 16, 17, 19, 20, 116, 117, 119], "obs_t": 14, "obs_tp1": 14, "plotter": 14, "render_fp": [14, 18, 117], "30": [14, 18, 24, 68, 71, 101, 102], "amount": [14, 44, 46, 47, 49, 55, 74, 88, 93, 103, 104, 119], "input": [14, 15, 21, 116], "receiv": [14, 15, 21, 34, 37, 41, 44, 45, 51, 57, 60, 89, 90, 95, 108, 114, 116, 118, 119], "map": [14, 19, 21, 42, 113, 114, 116, 117, 119], "unicod": 14, "suppos": 14, "trigger": [14, 114], "key_to_act": 14, "ord": [14, 117], "unknown": [14, 109], "horizon_timestep": 14, "plot_nam": 14, "live": [14, 27, 30, 33, 34, 36, 39, 44, 45, 48, 55, 59, 60, 66, 72, 77, 116], "compute_metr": 14, "obs_tp": 14, "cumulative_reward": 14, "linalg": [14, 117], "norm": [14, 105, 106, 117], "along": [14, 16, 21, 22, 58, 59, 61, 72, 89, 93, 94, 95, 99, 103, 104, 107, 112], "conjunct": 14, "evolv": 14, "200": [14, 49, 72, 90, 92, 93, 94, 96, 113, 114], "immedi": [14, 16, 20, 111, 117], "cumul": [14, 16, 18], "magnitud": [14, 90, 95, 103, 104, 119], "your_env": 14, "len": [14, 17, 116], "horizon": [14, 74, 100, 108, 118], "titl": [14, 94, 95, 116, 119], "dependencynotinstal": [14, 18], "matplotlib": [14, 116, 119], "playablegam": 14, "process_ev": 14, "event": [14, 117], "particular": [14, 16, 19, 21, 22, 90, 118], "keep": [14, 16, 18, 32, 45, 64, 67, 75, 76, 84, 93, 102, 117], "track": [14, 16, 18, 76, 89, 93, 98, 99, 100, 101, 102, 103, 104, 107, 108], "exit": [14, 15], "save_video": 14, "video_fold": [14, 18], "episode_trigg": [14, 18], "step_trigg": [14, 18], "video_length": [14, 18], "name_prefix": [14, 18], "episode_index": 14, "step_starting_index": 14, "extract": 14, "compos": 14, "record": [14, 16, 88, 119], "store": [14, 15, 18, 119], "iff": [14, 18, 117], "isn": 14, "entir": [14, 18, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 100, 108, 109], "snippet": [14, 18], "captur": [14, 18, 83], "Will": [14, 18], "prepend": [14, 18], "filenam": [14, 18], "moviepi": [14, 18], "imagesequenceclip": 14, "durat": [14, 98, 100, 101, 102, 103, 104, 105, 106, 108, 119], "step_index": 14, "199": 14, "capped_cubic_video_schedul": 14, "episode_id": 14, "8": [14, 15, 19, 20, 22, 24, 26, 28, 30, 31, 33, 35, 39, 44, 46, 47, 48, 49, 50, 51, 52, 53, 54, 58, 61, 63, 64, 80, 84, 85, 89, 90, 92, 93, 96, 98, 99, 100, 101, 102, 103, 105, 106, 107, 108, 113, 119], "27": [14, 92, 98, 101, 102], "729": 14, "1000": [14, 18, 21, 72, 74, 89, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 115, 119], "2000": [14, 88, 114], "3000": 14, "schedul": [14, 113], "step_api_compat": [14, 22], "step_return": 14, "output_truncation_bool": [14, 18], "is_vector_env": 14, "doc": [14, 18, 90], "ob": [14, 16, 19, 114, 116, 119], "interfac": [14, 115], "conflict": [14, 109], "final": [14, 15, 18, 57, 116, 117, 118], "desir": [14, 107, 108, 114], "oldenv": 14, "vec_env": 14, "convert_to_terminated_truncated_step_api": [14, 22], "irrespect": 14, "convert_to_done_step_api": 14, "omit": [14, 97, 98, 99, 100, 101, 102, 107, 108], "env_check": 14, "check_env": 14, "skip_render_check": 14, "invas": [14, 78], "farama": [14, 16, 109, 116, 117, 119], "org": [14, 24, 116, 119], "content": 14, "environment_cr": [14, 117], "ignor": [14, 24, 111, 116], "skip": [14, 18, 24, 117], "ci": 14, "linear": [15, 90, 92, 103, 104, 107, 119], "speed": [15, 35, 88, 89], "taken": [15, 18, 48, 54, 91, 93, 117, 119], "wait": [15, 48, 50, 74, 118], "until": [15, 16, 47, 60, 105, 111, 112, 113, 117, 119], "overwritten": [15, 16], "final_observ": [15, 18], "final_info": [15, 18], "asyncvectorenv": 15, "syncvectorenv": 15, "single_observation_spac": 15, "single_action_spac": 15, "v25": [15, 23], "rememb": [15, 18, 89, 117], "share": [15, 119], "other": [15, 16, 17, 18, 19, 22, 30, 39, 42, 50, 56, 90, 96, 97, 99, 103, 105, 106, 108, 113, 114, 116, 117, 119], "word": [15, 105, 119], "02240574": 15, "03439831": 15, "03904812": 15, "02810693": 15, "01586068": 15, "01929009": 15, "02394426": 15, "04016077": 15, "01314174": 15, "03893502": 15, "02400815": 15, "0038326": 15, "00122802": 15, "16228443": 15, "02521779": 15, "23700266": 15, "00788269": 15, "17490888": 15, "03393489": 15, "31735462": 15, "04918966": 15, "19421194": 15, "02938497": 15, "29495203": 15, "releas": [15, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 92, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 112, 113, 114, 117], "resourc": [15, 116, 117], "viewer": 15, "close_extra": 15, "synchron": 15, "asynchron": 15, "garbag": 15, "04456399": 15, "04653909": 15, "01326909": 15, "02099827": 15, "03073904": 15, "00145001": 15, "03088818": 15, "03131252": 15, "03468829": 15, "01500225": 15, "01230312": 15, "01825218": 15, "registri": [15, 21], "env_fn": 15, "context": [15, 119], "daemon": 15, "worker": [15, 68], "pipe": 15, "commun": 15, "lambda": [15, 19, 20, 116], "81": [15, 96], "62": 15, "8286432": 15, "5597771": 15, "90249056": 15, "85009176": 15, "5266346": 15, "60007906": 15, "back": [15, 16, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 52, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 98, 99], "effici": [15, 19, 94, 95, 103], "subprocess": 15, "flag": [15, 94, 109], "turn": [15, 18, 23, 27, 28, 89, 90, 103, 109], "quit": [15, 117], "head": [15, 99], "spawn": [15, 106], "children": 15, "overrid": [15, 16], "inner": 15, "logic": [15, 89, 117], "degre": [15, 19, 101, 102, 103], "chanc": 15, "shoot": [15, 31, 40, 42, 47, 48, 55, 56, 65, 68, 72, 77, 78, 86], "yourself": [15, 48, 68, 89, 116, 117], "foot": [15, 99, 100, 108], "thu": [15, 24, 50, 51, 52, 53, 54, 105, 106, 109], "_worker": 15, "_worker_shared_memori": 15, "runtimeerror": 15, "serial": 15, "modular": [16, 21, 109, 117], "behavior": [16, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 96, 98, 99, 100, 101, 102, 107, 108, 109, 117], "modif": [16, 105, 106], "without": [16, 21, 46, 101, 111, 113, 116, 117], "alter": [16, 21, 24, 117], "lot": [16, 21, 116, 119], "boilerpl": [16, 21, 117], "chain": [16, 21, 92, 107], "base_env": [16, 21], "wrapped_env": [16, 17, 18, 21, 117, 119], "min_act": [16, 17, 21], "max_act": [16, 17, 21], "access": [16, 18, 23, 55], "underneath": [16, 21, 93], "anoth": [16, 39, 101, 102, 104, 105, 106, 108, 114, 116, 118, 119], "get": [16, 21, 24, 44, 47, 48, 49, 56, 66, 67, 68, 69, 71, 72, 73, 78, 88, 90, 98, 100, 101, 103, 111, 116, 118], "layer": [16, 21, 119], "bare": 16, "box2d": [16, 21, 88, 89, 90], "bipedal_walk": [16, 21, 88], "0x7f87d70712d0": [16, 21], "three": [16, 24, 27, 30, 32, 45, 53, 59, 66, 71, 72, 73, 74, 98, 100, 101, 102, 107, 108, 117], "thing": [16, 19, 24], "do": [16, 18, 19, 20, 24, 37, 49, 70, 74, 75, 89, 90, 92, 98, 99, 100, 101, 107, 108, 117, 119], "Such": 16, "actionwrapp": [16, 17], "observationwrapp": [16, 19, 117], "rewardwrapp": [16, 20], "present": [16, 92, 109, 116, 117, 118], "section": [16, 24, 75, 98, 99, 100, 101, 107, 108, 116, 117], "found": [16, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 97, 109, 116, 119], "github": [16, 97, 112, 117], "com": [16, 112, 113, 117, 119], "foundat": [16, 109, 117], "forget": [16, 117], "wrapperacttyp": [16, 17], "wrapperobstyp": [16, 19], "commonli": [16, 21], "page": [16, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 89, 90, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 112, 113, 114], "descript": [16, 117], "misc": 16, "tp": 16, "atari": [16, 21, 22, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 116], "compat": [16, 19, 21, 109, 115], "21": [16, 22, 98, 101, 102, 105, 111, 116], "filter": 16, "request": [16, 111], "anobserv": 16, "stack": [16, 19], "roll": [16, 19, 37, 105], "grai": [16, 18], "scale": [16, 18, 20, 24, 90, 98, 99, 100, 101, 107, 108, 109], "center": [16, 19, 89, 90, 93, 96, 98, 99, 101, 102], "unit": [16, 19, 58, 92, 94, 95, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108], "varianc": [16, 19, 20], "averag": [16, 20, 101, 118, 119], "augment": [16, 19], "obtain": [16, 18, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 96, 111, 118, 119], "replac": [16, 23, 111, 116], "recordvideo": [16, 18, 23], "rollout": [16, 18, 114], "save": [16, 18, 23], "rescal": [16, 21], "axbxc": [16, 19], "resiz": [16, 18], "trajectori": [16, 19, 20, 90, 101, 102], "append": [16, 19, 116, 119], "th": 16, "sometim": [16, 20, 113, 117], "still": [16, 23, 24, 116], "let": [16, 17, 20, 24, 39, 109, 116, 117, 119], "penal": [16, 75], "energi": [16, 88, 90, 93, 109], "weight": [16, 98, 99, 100, 101, 105, 106, 107, 108, 109, 118, 119], "those": [16, 26, 28, 29, 30, 31, 32, 35, 37, 39, 40, 44, 46, 47, 48, 49, 58, 61, 63, 64, 65, 67, 68, 70, 75, 77, 78, 80, 81, 82, 84, 85, 92, 97, 98, 99, 100, 101, 102, 103, 104, 108], "nevertheless": 16, "reacherrewardwrapp": 16, "reward_dist_weight": 16, "reward_ctrl_weight": 16, "reward_dist": [16, 105, 106], "reward_ctrl": [16, 105, 106], "suffici": [16, 30, 32, 34, 36, 41, 116], "simpli": [17, 18, 19, 20, 24, 117], "overwrit": [17, 19, 20], "domain": [17, 89, 92, 94, 95, 114], "sai": [17, 18], "discreteact": 17, "disc_to_cont": 17, "act": [17, 116], "__name__": 17, "__main__": 17, "print": [17, 117, 119], "among": [17, 19, 91, 97], "biped": [17, 87, 101, 102], "walker": [17, 87, 97, 106, 108], "affin": [17, 90], "75": [17, 98], "noop_max": 18, "frame_skip": [18, 98, 99, 100, 101, 107, 108], "screen_siz": 18, "84": [18, 98, 101, 102], "terminal_on_life_loss": 18, "grayscale_ob": 18, "grayscale_newaxi": 18, "scale_ob": 18, "2600": [18, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86], "guidelin": 18, "machado": [18, 24], "et": [18, 24], "al": [18, 22, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 116], "2018": [18, 24, 92], "revisit": [18, 24], "arcad": [18, 24, 31, 48, 50, 51, 52, 53, 54, 109], "evalu": [18, 24, 116], "protocol": [18, 24], "open": [18, 24, 37, 97, 109, 117], "problem": [18, 24, 90, 93, 96, 103, 104, 107, 109, 111, 114, 115, 118], "stage": 18, "op": 18, "pool": [18, 107], "recent": [18, 19, 20, 22], "life": [18, 30, 44, 48, 72, 76, 119], "lost": [18, 33, 41, 60, 73, 77], "loss": [18, 111, 119], "off": [18, 23, 41, 56, 64, 72, 89, 90, 112, 114], "squar": [18, 19, 73, 105, 106, 114, 117], "210x180": 18, "84x84": 18, "grayscal": [18, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86], "colour": [18, 89], "greyscal": 18, "255": [18, 19, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 89, 117], "frequenc": 18, "experi": [18, 98, 101, 102, 103, 104, 116, 119], "whenev": [18, 30, 33, 117], "channel": 18, "axi": [18, 94, 95, 99, 101, 102, 107, 116], "dimension": [18, 21, 28, 90, 98, 99, 100, 106, 107, 108, 117], "memori": [18, 19, 94, 95], "optim": [18, 24, 88, 90, 101, 102, 109, 116, 119], "benefit": 18, "opencv": 18, "new_ob": 18, "final_reward": 18, "final_termin": 18, "final_trunc": 18, "final_don": 18, "prior": 18, "alongsid": 18, "previou": [18, 98, 101, 102, 118], "re": [18, 56, 71, 74, 117, 119], "old_env": 18, "legacyenv": 18, "retun": 18, "modern": [18, 109], "convers": [18, 22, 109], "cartpoleenv": 18, "customenv": 18, "manual": [18, 21, 23, 24, 50, 51, 52, 53, 54], "unregist": 18, "surround": 18, "test": [18, 88, 109, 117, 119], "haven": 18, "screen": [18, 24, 26, 30, 34, 39, 40, 42, 51, 57, 63, 73, 74, 98, 99, 100, 101, 102, 103, 104, 107, 108], "nativ": 18, "nonativerend": 18, "disable_render_order_enforc": 18, "classic_control": [18, 23, 91], "resetneed": 18, "deque_s": [18, 116], "At": [18, 21, 33, 44, 47, 58], "_episod": 18, "l": [18, 107], "elaps": 18, "sinc": [18, 22, 24, 50, 51, 52, 53, 54, 87, 93, 97, 106, 109, 114, 117, 118], "begin": [18, 23, 30, 33, 46, 71, 72, 73, 74, 116, 117], "num": [18, 24, 26, 28, 29, 30, 31, 32, 35, 37, 39, 40, 44, 46, 47, 48, 49, 50, 51, 52, 53, 54, 58, 61, 63, 64, 65, 67, 68, 70, 75, 77, 78, 80, 81, 82, 84, 85, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108], "buffer": [18, 19, 89], "return_queu": [18, 116, 119], "length_queu": [18, 116], "disable_logg": 18, "intermitt": 18, "hundredth": 18, "emploi": 18, "stop": [18, 21, 68, 78, 86, 111, 116, 118], "span": 18, "strictli": 18, "logger": 18, "pop_fram": 18, "reset_clean": 18, "clear": [18, 78], "issu": [18, 21, 23, 24, 98, 100, 101, 102, 108, 117], "place": [18, 28, 93, 94, 95, 117], "\u01f9one": 18, "outermost": 18, "actual": [18, 114, 117], "_k": 18, "classic": [18, 21, 23, 90, 92, 93, 94, 95, 96, 100, 104, 107, 108, 118], "reflect": [19, 93], "2d": [19, 106], "navig": [19, 33, 69, 114, 117], "agent_posit": 19, "target_posit": 19, "throw": [19, 59], "awai": [19, 27, 67, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108], "freedom": [19, 101, 102, 103], "target": [19, 40, 92, 105, 106, 117, 118], "rel": [19, 92, 101, 102, 117], "relativeposit": [19, 117], "f": [19, 20, 116, 119], "ideal": 19, "subclass": 19, "accordingli": [19, 74, 117], "incorrectli": [19, 118], "randn": 19, "08319338": 19, "04635121": 19, "07394746": 19, "20877492": 19, "filter_kei": 19, "00067088": 19, "01860439": 19, "04772898": 19, "01911527": 19, "04560107": 19, "04466959": 19, "0328232": 19, "02367178": 19, "04649447": 19, "14996664": 19, "03329664": 19, "25847703": 19, "96": [19, 24, 89], "27648": 19, "num_stack": 19, "lz4_compress": 19, "lazyfram": 19, "fill": [19, 33, 117], "lz4": 19, "compress": 19, "keep_dim": 19, "uint8": [19, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86], "singleton": 19, "axbx1": 19, "axb": 19, "epsilon": [19, 20, 116], "1e": [19, 20, 101, 107, 108, 119], "past": [19, 20], "newli": [19, 20], "stabil": [19, 20, 101, 102, 119], "pixels_onli": 19, "render_kwarg": 19, "pixel_kei": 19, "choos": [19, 117], "odict_kei": 19, "400": [19, 114], "600": 19, "discard": 19, "assertionerror": 19, "typeerror": 19, "unexpect": 19, "64": [19, 24], "03810719": 19, "03522411": 19, "02231044": 19, "01088205": 19, "03881167": 19, "16021058": 19, "0220928": 19, "28875574": 19, "becaus": [20, 23, 116, 117], "intrins": 20, "gain": [20, 34, 70, 76, 77, 80], "numer": [20, 102, 103, 104, 111, 119], "clipreward": 20, "invari": 20, "incorrect": [20, 114, 118], "gamma": [20, 118, 119], "99": [20, 119], "discount": [20, 116, 118, 119], "factor": [20, 116, 119], "mountain": [21, 91], "car": [21, 33, 49, 87, 91, 109], "four": [21, 33, 44, 89, 90, 98, 100, 108, 114, 116], "introduc": [21, 22, 23, 98, 101, 102], "core": 21, "markov": [21, 118], "decis": [21, 23, 109, 118], "theori": [21, 96, 103], "perfect": 21, "reconstruct": 21, "miss": [21, 75, 92, 114], "compon": [21, 117], "veri": [21, 90, 105, 117], "easi": [21, 60, 110], "loop": [21, 23, 109, 116], "pictur": 21, "simplifi": [21, 96], "someth": 21, "spaceship": [21, 31, 45, 76], "land": [21, 38, 72, 90], "safe": [21, 68, 90], "document": [21, 24, 25, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 91, 98, 101, 102, 103, 110, 116, 117], "imagin": [21, 109], "robot": [21, 23, 36, 86, 88, 94, 95, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 118], "destroi": [21, 27, 29, 31, 32, 33, 34, 35, 36, 39, 40, 41, 42, 45, 46, 54, 60, 71, 72, 73, 76, 77, 78, 80, 90], "enemi": [21, 28, 29, 32, 34, 35, 36, 42, 45, 46, 48, 61, 70, 71, 73, 74, 76, 77, 78, 80, 86], "exchang": 21, "crash": [21, 90], "succeed": 21, "similarli": [21, 90], "restart": 21, "train": [21, 23], "major": 21, "our": [21, 116, 117], "simpl": [21, 88, 110, 115, 118, 119], "util": [21, 22, 117], "coupl": 21, "nich": 21, "li": [21, 109], "lie": 21, "aspect": [21, 118], "regist": [22, 24], "sole": 22, "special": [22, 27, 57, 119], "gymv26environ": 22, "relev": [22, 117], "pong": [22, 24, 39, 43], "v5": [22, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86], "signific": 22, "introduct": [22, 92, 111, 112], "signatur": 22, "previous": [22, 24, 33], "backward": [22, 99, 119], "compliant": [22, 23], "oldv21env": 22, "break": [23, 31, 39, 89], "briefli": 23, "outlin": [23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 111, 116], "stuck": [23, 27, 36, 55], "123": 23, "emul": [23, 24], "awar": 23, "randint": 23, "utilis": 23, "contrast": 23, "older": [23, 97], "definit": [23, 98, 100, 101, 118], "expand": [23, 24, 50, 51, 52, 53, 54], "blog": 23, "post": [23, 32], "soon": [23, 117], "extra": [23, 28, 33, 34, 36, 40, 42, 55, 74, 109, 116, 117], "address": 23, "associ": 23, "librari": [23, 115, 117], "primari": 23, "shouldn": [23, 117], "happen": [23, 73, 94, 95, 98, 100, 101, 102, 103, 104, 105, 106, 108, 111, 113, 114, 118], "fly": [23, 26, 31, 55, 71, 90], "shown": [23, 59, 89, 92, 118], "explan": [23, 116, 119], "summari": 23, "goalenv": 23, "reimplement": 23, "system": [23, 54, 92, 96, 103, 104, 109], "monitor": 23, "stella": 24, "adventur": [24, 43], "air": [24, 43], "raid": [24, 43], "alien": [24, 43, 45, 65, 78], "amidar": [24, 32, 43], "assault": [24, 43], "asterix": [24, 43], "asteroid": [24, 43], "atlanti": [24, 43], "licens": [24, 109, 116, 119], "download": [24, 116, 117, 118, 119], "locat": [24, 60, 109, 112, 113, 114, 117], "agre": 24, "todo": [24, 114], "legal": [24, 50, 51, 52, 53, 54], "fire": [24, 26, 28, 29, 31, 32, 35, 37, 39, 40, 50, 51, 52, 53, 54, 57, 64, 65, 67, 68, 70, 71, 73, 74, 77, 78, 80, 82, 84, 85, 90], "upright": [24, 30, 31, 35, 44, 46, 47, 48, 49, 50, 51, 52, 53, 54, 58, 63, 93, 96, 103, 104], "upleft": [24, 30, 31, 35, 44, 46, 47, 48, 49, 50, 51, 52, 53, 54, 58, 63], "downright": [24, 30, 44, 46, 47, 48, 49, 50, 51, 52, 53, 54, 58, 61, 63], "downleft": [24, 30, 44, 46, 47, 48, 49, 50, 51, 52, 53, 54, 58, 61, 63], "upfir": [24, 28, 31, 37, 50, 51, 52, 53, 54, 68, 80, 81, 82, 84, 85], "11": [24, 31, 50, 51, 52, 53, 54, 58, 61, 98, 99, 100, 101, 102, 103, 105, 106, 108, 111, 112, 116], "rightfir": [24, 26, 28, 29, 31, 32, 35, 40, 50, 51, 52, 53, 54, 58, 61, 64, 65, 67, 77, 80, 81, 84, 85], "leftfir": [24, 26, 28, 29, 31, 32, 40, 50, 51, 52, 53, 54, 58, 61, 64, 65, 67, 77, 80, 81, 84, 85], "13": [24, 31, 50, 51, 52, 53, 54, 58, 61, 98, 99, 101, 102, 105, 108, 114], "downfir": [24, 28, 31, 37, 50, 51, 52, 53, 54, 58, 61, 65, 68, 80, 82, 85], "14": [24, 50, 51, 52, 53, 54, 58, 88, 90, 98, 99, 101, 102, 105, 108, 116], "uprightfir": [24, 31, 50, 51, 52, 53, 54, 58, 61], "upleftfir": [24, 31, 50, 51, 52, 53, 54, 58, 61], "16": [24, 33, 36, 39, 45, 50, 51, 52, 53, 54, 58, 96, 98, 99, 101, 102, 105, 108, 113, 116, 119], "downrightfir": [24, 50, 51, 52, 53, 54, 58, 61], "17": [24, 36, 50, 51, 52, 53, 54, 58, 98, 99, 101, 102, 105, 108, 111], "downleftfir": [24, 50, 51, 52, 53, 54, 58, 61], "smaller": [24, 29, 31, 50, 51, 52, 53, 54], "enumer": [24, 50, 51, 52, 53, 54], "full_action_spac": [24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86], "reduc": [24, 26, 28, 29, 30, 31, 32, 35, 37, 39, 40, 44, 46, 47, 48, 49, 50, 51, 52, 53, 54, 58, 61, 63, 64, 65, 67, 68, 70, 75, 77, 78, 80, 81, 82, 84, 85, 93, 116], "difficulti": [24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 109], "choic": [24, 119], "player": [24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 109, 111, 112, 113, 114, 116], "128": [24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86], "byte": [24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86], "ram": [24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86], "exact": [24, 37, 50, 51, 52, 53, 54, 111, 116], "atariag": [24, 25, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 79, 81, 82, 83, 84, 85, 86], "determinist": [24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 92, 94, 95, 117], "art": 24, "memor": 24, "sticki": [24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86], "small": [24, 54, 73, 88, 109, 110, 119], "On": [24, 65, 92, 93, 94, 95, 96], "top": [24, 39, 44, 51, 57, 59, 73, 89, 90, 91, 94, 95, 100, 103, 104, 108, 117, 119], "repeat": [24, 105], "frameskip": [24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86], "exclus": 24, "tabl": [24, 27, 28, 30, 44, 46, 101, 102, 105], "obs_typ": 24, "Its": 24, "repeat_action_prob": [24, 50, 51, 52, 53, 54], "stick": [24, 33, 55, 111, 116], "ll": [24, 57, 74, 116], "sound": 24, "lock": 24, "proper": 24, "audio": 24, "framer": [24, 102, 105, 106, 117], "best": [24, 50, 51, 52, 53, 54, 116], "practic": [24, 50, 51, 52, 53, 54, 109, 116, 118], "configur": [24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 91, 97, 110, 116, 117], "variat": 24, "amidardeterminist": 24, "amidarnoframeskip": 24, "ramdeterminist": 24, "ramnoframeskip": 24, "suffix": [24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86], "noframeskip": [24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86], "airraid": [24, 26], "31": [24, 31, 101, 102], "bankheist": [24, 33], "20": [24, 33, 39, 66, 74, 90, 98, 101, 102, 105, 114, 116], "24": [24, 33, 39, 64, 88, 89, 90, 93, 98, 101, 102, 116], "battlezon": [24, 34], "beamrid": [24, 35], "berzerk": [24, 43], "18": [24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 98, 99, 101, 102, 105, 108], "bowl": [24, 43], "breakout": [24, 43], "32": [24, 39, 56, 101, 102, 111, 119], "36": [24, 39, 101, 102, 112], "40": [24, 39, 64, 101, 102], "44": [24, 39, 101, 102], "carniv": [24, 43], "centiped": [24, 43], "22": [24, 41, 98, 101, 102, 105, 116], "86": [24, 41], "choppercommand": [24, 42], "crazyclimb": [24, 44], "defend": [24, 32, 43, 48, 64, 76], "demonattack": [24, 46], "doubledunk": [24, 47], "elevatoract": [24, 48], "enduro": [24, 43], "fishingderbi": 24, "freewai": [24, 43], "frostbit": [24, 43], "gopher": [24, 43], "gravitar": [24, 43], "hero": [24, 43], "icehockei": 24, "jamesbond": [24, 43], "journeyescap": 24, "kangaroo": [24, 43], "krull": [24, 43], "kungfumast": [24, 61], "montezumareveng": [24, 62], "mspacman": [24, 63], "namethisgam": [24, 64], "phoenix": [24, 43], "pitfal": [24, 43, 88], "pooyan": [24, 43], "50": [24, 58, 68, 74, 90, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 119], "70": [24, 68], "privateey": 24, "qbert": [24, 43], "riverraid": [24, 43], "roadrunn": [24, 72], "robotank": [24, 43, 73], "seaquest": [24, 43], "ski": [24, 43], "solari": [24, 43], "spaceinvad": 24, "stargunn": 24, "tenni": [24, 43], "timepilot": 24, "tutankham": [24, 43], "upndown": [24, 82], "ventur": [24, 43], "videopinbal": [24, 84, 85], "wizardofwor": [24, 85], "yarsreveng": 24, "zaxxon": [24, 43], "oppos": 24, "ai": [24, 109], "mg": 24, "bellemar": 24, "naddaf": 24, "j": [24, 119], "veness": 24, "platform": 24, "journal": [24, 114], "artifici": [24, 114], "intellig": [24, 114], "research": [24, 97, 103, 114], "2012": 24, "url": 24, "jair": [24, 114], "php": 24, "articl": [24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86], "view": [24, 54], "11182": 24, "250": [25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86], "160": [25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86], "enchant": [25, 41], "chalic": 25, "golden": 25, "castl": 25, "pick": [25, 48, 59, 72, 114, 116], "sword": 25, "bridg": [25, 71, 109], "magnet": 25, "fight": [25, 38, 61, 64, 109], "outmanoeuvr": 25, "dragon": 25, "flavor": [25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86], "switch": [25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 109], "thorough": [25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86], "discuss": [25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86], "intric": [25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86], "stochast": [25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 91, 92, 94, 95, 97, 98, 99, 100, 101, 102, 103, 104, 106, 107, 108, 112, 114], "ship": [26, 27, 29, 35, 45, 54, 76], "sidewai": [26, 29, 35, 71, 75], "protect": [26, 32, 41, 42, 53, 58, 68], "saucer": [26, 31, 78], "try": [26, 27, 28, 37, 39, 44, 67, 68, 116], "drop": [26, 33, 114], "bomb": [26, 45, 57, 65, 78], "meaning": [26, 28, 29, 30, 31, 32, 35, 37, 39, 40, 44, 46, 47, 48, 49, 58, 61, 63, 64, 65, 67, 68, 70, 75, 77, 78, 80, 81, 82, 84, 85], "210": [27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 45, 46, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86], "maze": [27, 28, 33, 36, 62, 81], "egg": 27, "scatter": [27, 69], "simultan": [27, 28], "kill": [27, 36, 55, 60], "flamethrow": 27, "tricki": 27, "situat": [27, 114], "occasion": [27, 31], "power": [27, 55, 89, 90, 95, 103, 104, 119], "pulsar": 27, "temporari": 27, "abil": 27, "score": [27, 28, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 55, 56, 57, 58, 59, 60, 66, 67, 68, 69, 70, 71, 72, 74, 78, 79, 80, 84, 88, 90], "prize": [27, 82], "caught": [27, 33], "lose": [27, 30, 32, 41, 44, 45, 48, 55, 57, 66, 67, 69, 71, 72, 74, 75, 76, 90, 111, 116], "consult": [27, 56, 57, 58, 59, 60], "pac": 28, "man": 28, "visit": [28, 48, 89], "grid": [28, 112, 113, 114, 116, 117], "chicken": [28, 40, 51], "catch": [28, 44, 50, 72], "travers": 28, "vehicl": [29, 34, 49, 58], "big": [29, 50, 117], "mother": [29, 59, 68], "circl": [29, 117], "overhead": [29, 90], "deploi": 29, "drone": 29, "dodg": [29, 35, 74], "attack": [29, 31, 32, 35, 43, 45, 68], "horizont": [30, 40, 88, 90, 92, 117], "vertic": [30, 88, 103, 104, 117], "lyre": 30, "guid": [30, 51, 109], "award": [30, 36, 41, 44, 48, 74, 103, 104], "field": 31, "appear": [31, 33, 36, 73, 94, 95], "satellit": 31, "ufo": 31, "job": [32, 117], "submerg": 32, "citi": [32, 33, 69], "slowli": 32, "descend": 32, "toward": [32, 56, 107], "strike": [32, 37], "distanc": [32, 49, 99, 117], "defens": [32, 47], "manag": [32, 37], "seven": 32, "fought": 32, "wave": [32, 42, 46, 58, 65, 78], "outer": [32, 92], "robber": 33, "natur": [33, 111, 113, 116], "rob": 33, "getawai": 33, "polic": 33, "chase": [33, 36], "dynamit": [33, 55], "ga": [33, 89], "tank": [33, 34, 74], "nine": [33, 98], "leav": [33, 93, 97, 103, 117], "person": [34, 92, 109], "perspect": [34, 109], "3d": [34, 98, 101, 102, 109, 116], "illus": 34, "radar": [34, 85], "travel": 35, "steer": [35, 82, 89], "debri": 35, "leftifir": 35, "evil": [36, 61, 86], "touch": [36, 69, 117], "wall": [36, 39, 55, 94, 95, 114], "undefeat": 36, "otto": 36, "tri": 37, "knock": [37, 38], "pin": 37, "spar": 37, "spare": 37, "300": [37, 49, 88, 117], "oppon": [38, 50, 56, 67, 82], "ring": 38, "hit": [38, 39, 40, 41, 46, 68, 69, 72, 73, 75, 111, 116], "punch": [38, 59], "famou": 39, "paddl": [39, 67], "ball": [39, 56, 67, 84], "brick": 39, "wreak": 39, "havoc": 39, "five": [39, 69, 75, 91, 119], "214": 40, "em": 40, "gun": [40, 48], "suppli": [40, 64, 118], "ammunit": 40, "steal": [40, 50], "bullet": [40, 109], "subtract": 40, "minu": 40, "sign": [40, 103, 104, 119], "elf": [41, 113], "magic": 41, "wand": 41, "fend": 41, "spider": 41, "flea": 41, "mushroom": 41, "forest": 41, "bitten": 41, "tempor": 41, "paralyz": 41, "scorpion": 41, "round": 41, "helicopt": [42, 44, 71], "truck": [42, 72], "convoi": 42, "aircraft": [42, 80], "mini": 42, "bottom": [42, 57, 89, 94, 95, 100, 108, 112], "plane": 42, "surviv": [42, 46], "bank": [43, 71], "heist": 43, "battl": 43, "zone": 43, "beam": [43, 55], "rider": 43, "chopper": 43, "command": [43, 97], "crazi": 43, "climber": 43, "demon": 43, "doubl": [43, 97], "dunk": 43, "elev": 43, "fish": 43, "derbi": 43, "ic": [43, 46, 52, 56, 113], "hockei": [43, 56], "journei": [43, 58, 116], "kung": 43, "fu": 43, "master": [43, 112, 119], "montezuma": 43, "reveng": 43, "pacman": 43, "privat": [43, 69, 117], "ey": [43, 64, 69], "road": [43, 89], "runner": 43, "invad": [43, 77], "star": 43, "gunner": 43, "pilot": [43, 65, 86], "pinbal": 43, "wizard": [43, 61], "Of": 43, "wor": 43, "yar": 43, "builid": 44, "obstacl": [44, 58, 59], "fall": [44, 46, 66, 72, 88, 101, 112, 113, 118], "damag": [44, 73], "climb": [44, 59, 91], "fast": [44, 89, 97, 99, 101, 103, 107, 109], "least": [44, 79, 90], "row": [44, 77, 112, 113], "earth": [45, 77], "rescu": [45, 55, 59, 60, 61, 74, 76], "smart": 45, "shot": [45, 47, 48, 56, 57, 72, 109], "abduct": 45, "unlimit": 45, "laser": [45, 55, 77, 85], "missil": [45, 71], "aliv": [45, 101, 108], "face": [46, 98, 101, 102, 111, 116], "planet": [46, 54, 76], "krybor": 46, "accumul": 46, "reserv": [46, 71, 73, 74], "bunker": [46, 54], "increas": [46, 74, 90, 92, 93, 100, 107, 108, 116], "grant": [46, 90], "slai": 46, "2v2": 47, "basketbal": 47, "possess": 47, "rival": 47, "team": 47, "rule": [47, 79, 109, 111, 116], "foul": 47, "success": [47, 92, 114, 118], "secret": [48, 69], "ground": [48, 68, 88, 90, 98, 102, 109], "stair": 48, "equip": 48, "against": [48, 67, 79, 109], "floor": 48, "gather": [48, 69, 117], "apart": [48, 117], "mark": 48, "red": [48, 54, 114, 117], "door": 48, "unreleas": 48, "prototyp": 48, "500": [48, 71, 92, 93, 114, 116], "racer": 49, "nation": 49, "long": [49, 84, 93, 103, 104], "endur": 49, "race": [49, 72, 75, 87], "overtak": 49, "dai": [49, 87], "stai": 49, "meet": 49, "quota": 49, "sunfish": 50, "But": [50, 75], "fisherman": 50, "black": [50, 60, 92, 116], "shark": [50, 64, 74], "lurk": [50, 70], "surfac": [50, 74, 103, 104, 117], "lane": [51, 109], "busi": 51, "rush": 51, "hour": 51, "traffic": [51, 109], "cross": [51, 112, 113], "bailei": 52, "who": [52, 53, 58, 59, 75], "hop": [52, 70, 100, 108], "forth": 52, "arctic": 52, "river": [52, 71], "block": 52, "white": 52, "blue": [52, 54, 79, 92, 114, 117], "he": [52, 54], "hi": [52, 54, 69], "igloo": 52, "shovel": 53, "wield": 53, "farmer": 53, "crop": 53, "carrot": 53, "spacecraft": 54, "fiction": 54, "solar": 54, "landscap": 54, "miner": 55, "mine": [55, 72], "shaft": 55, "tool": [55, 62], "propel": 55, "backpack": 55, "wherev": 55, "blast": [55, 74, 76], "vermin": 55, "raft": 55, "stretch": 55, "critter": 55, "remain": [55, 58, 59, 74, 98, 112, 117, 118], "standard": [56, 98, 99, 103, 109, 119], "minut": [56, 66], "period": [56, 100, 108], "puck": 56, "angl": [56, 57, 88, 90, 92, 93, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108], "extrem": [56, 109, 110], "rink": 56, "realli": [56, 116], "mr": 57, "bond": 57, "design": [57, 92, 98, 101, 102, 109, 110, 114, 117], "multipurpos": 57, "craft": [57, 90], "varieti": [57, 109], "motion": [57, 109], "slightli": [57, 88, 98], "jump": [57, 72, 75], "dive": 57, "lob": 57, "rate": [57, 74, 116, 119], "highest": 57, "novic": 57, "006": 57, "007": 57, "lead": 58, "peski": 58, "backstag": 58, "scarab": 58, "000": [58, 71, 74], "concert": 58, "cash": 58, "grasp": 58, "groupi": 58, "photograph": 58, "promot": 58, "encount": [58, 59, 80], "her": [59, 68], "preciou": 59, "babi": 59, "ladder": [59, 88], "bonu": [59, 73, 74, 78, 108], "fruit": 59, "monkei": 59, "corner": 59, "beast": 60, "fortress": [60, 62], "princess": [60, 61], "lyssa": 60, "sunris": 60, "monster": [60, 83], "templ": 61, "victoria": 61, "defeat": [61, 70], "acquir": [62, 97], "treasur": [62, 64, 66, 81, 83], "chamber": [62, 83], "emperor": 62, "deadli": 62, "creatur": [62, 70, 78, 109], "valuabl": 62, "pellet": 63, "ghost": 63, "discov": 64, "octopu": 64, "oxygen": [64, 74], "elimin": [65, 81, 82, 83], "war": 65, "bird": 65, "harri": 66, "jungl": 66, "die": [66, 68, 89], "misfortun": 66, "hole": [66, 113], "compet": 67, "deflect": 67, "pig": 68, "piglet": 68, "wolv": 68, "rope": 68, "balloon": 68, "guard": 68, "eat": [68, 72], "bait": 68, "wolf": 68, "stone": 68, "rock": [68, 72], "french": 69, "pierr": 69, "street": 69, "park": 69, "passag": 69, "dead": 69, "search": 69, "ringlead": 69, "henri": 69, "le": 69, "fiend": 69, "gang": 69, "evid": 69, "stolen": 69, "good": [69, 116], "statut": 69, "expir": 69, "nab": 69, "question": [69, 109], "auto": 69, "pothol": 69, "q": [70, 114, 118], "bert": 70, "cube": 70, "pyramid": 70, "destin": [70, 114], "nasti": 70, "jet": 71, "fli": 71, "fuel": [71, 76, 90], "depot": 71, "collid": [71, 74, 90], "squadron": [71, 73], "tanker": 71, "80": [71, 113], "tm": 72, "direct": [72, 74, 92, 93, 94, 95, 98, 100, 101, 103, 104, 108, 112, 113, 114, 117, 119], "outrun": 72, "wile": 72, "coyot": 72, "hazard": 72, "desert": 72, "rocket": [72, 73, 90], "cannon": [72, 77], "cliff": [72, 110], "steel": 72, "pile": 72, "birdse": 72, "cannonbal": 72, "activ": [73, 117], "scrambl": 73, "static": 73, "interfer": 73, "sensor": [73, 89], "report": [73, 88, 98, 101, 102], "flash": 73, "panel": 73, "c": [73, 90, 92, 119], "earn": 73, "twelv": 73, "abl": [74, 118], "torpedo": 74, "diver": 74, "killer": 74, "deliv": [74, 114], "six": [74, 108], "explod": 74, "anyth": 74, "decreas": [74, 90], "almost": 74, "yoursub": 74, "blow": 74, "forc": [74, 76, 90, 93, 94, 95, 98, 101, 102, 103, 104, 119], "less": [74, 88, 90, 103, 107], "worth": [74, 77], "90": [74, 116], "skier": 75, "gate": 75, "fastest": 75, "slalom": 75, "penalti": [75, 114], "warp": 76, "sector": 76, "feder": 76, "zylon": 76, "refuel": 76, "cadet": 76, "corridor": 76, "mania": [78, 80], "orang": 79, "win": [79, 111, 116], "margin": 79, "ti": 79, "sport": 79, "till": [79, 116], "technologi": 80, "increasingli": 80, "difficult": [80, 93, 97, 103, 104], "rack": 81, "tomb": 81, "guardian": 81, "baja": 82, "bugger": 82, "dungeon": 83, "beat": [85, 111], "scanner": 85, "armi": 86, "enslav": 86, "galaxi": 86, "fighter": 86, "lunar": 87, "lander": 87, "toi": [87, 111, 112, 113, 114], "contribut": 87, "earli": [87, 116, 119], "oleg": [87, 88, 89, 90], "klimov": [87, 88, 89, 90], "popular": [87, 109, 116], "benchmark": 87, "ever": 87, "joint": [88, 90, 92, 93, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108], "uneven": 88, "terrain": [88, 109], "hardcor": 88, "stump": 88, "1600": 88, "heurist": [88, 90], "demonstr": [88, 109], "motor": [88, 107], "hip": [88, 98, 101, 102], "knee": [88, 101, 102], "hull": 88, "angular": [88, 90, 92, 93, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108], "leg": [88, 90, 98, 100, 101, 102, 108], "contact": [88, 90, 97, 98, 101, 102, 103], "lidar": 88, "rangefind": 88, "measur": [88, 96, 98, 99, 100, 101, 102, 103, 105, 106, 107, 108], "far": [88, 89, 103, 105, 106, 113], "torqu": [88, 92, 96, 98, 99, 100, 101, 102, 105, 106, 107, 108], "cost": [88, 99, 100, 107, 108, 109], "better": 88, "stand": [88, 97, 98, 101, 102, 103, 104, 116], "slight": 88, "exce": [88, 111], "closest": 88, "trace": 88, "furthest": 88, "faster": [88, 90, 102], "spent": [88, 90], "friction": [88, 107, 109], "nervous": 88, "easiest": 89, "ab": 89, "wheel": 89, "gyroscop": 89, "car_rac": 89, "rear": 89, "drive": 89, "brake": 89, "96x96": 89, "tile": 89, "732": 89, "926": 89, "rest": [89, 90, 100, 108], "playfield": 89, "lap_complete_perc": 89, "dictat": [89, 90], "percentag": [89, 116], "lap": 89, "domain_random": 89, "variant": [89, 117], "scenario": [89, 109], "background": 89, "demand": 89, "correspondingli": 89, "init": [89, 117], "scheme": [89, 109], "chri": 89, "campbel": 89, "2014": 89, "www": [89, 111, 112, 113], "iforce2d": 89, "net": [89, 111, 112, 119], "b2dtut": 89, "pontryagin": 90, "principl": 90, "engin": [90, 97], "throttl": 90, "why": 90, "pad": 90, "infinit": [90, 100, 108, 111, 116, 118], "lunar_land": 90, "orient": [90, 98, 101, 102], "sum": [90, 98, 99, 100, 101, 102, 105, 106, 107, 108, 111, 116], "closer": [90, 111], "slower": 90, "tilt": 90, "03": 90, "solut": [90, 116], "viewport": 90, "mass": [90, 98, 99, 101, 102, 107], "bodi": [90, 97, 98, 99, 100, 101, 102, 103, 104, 107, 108], "moon": 90, "greater": [90, 92, 93, 94, 95, 99, 104, 105, 107, 111, 116], "awak": 90, "group": 90, "come": [90, 98, 99, 100, 101, 102, 103, 104, 107, 108], "sleep": 90, "littl": [90, 102], "cpu": 90, "wake": 90, "attach": [90, 93, 96, 98, 108], "graviti": [90, 93, 94, 96, 103, 104, 119], "enable_wind": 90, "wind_pow": 90, "turbulence_pow": 90, "later": [90, 116, 119], "booster": 90, "gravit": 90, "wind": 90, "tanh": [90, 119], "sin": [90, 96, 103], "pi": [90, 92, 96], "9999": 90, "rotat": [90, 92, 98, 101, 102, 105, 116], "turbul": 90, "renorm": 90, "harder": 90, "push": [90, 93, 103, 104, 109, 119], "cart": [91, 103, 104, 119], "nois": [91, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108], "regard": 91, "underpow": 91, "effort": 91, "easier": 91, "ones": [91, 97, 116], "57": 92, "spars": [92, 117], "coars": 92, "barto": [92, 93, 103, 104, 111, 112, 116], "book": [92, 111, 112, 116], "link": [92, 98, 99, 100, 101, 102, 106, 107], "linearli": [92, 103, 104, 119], "actuat": [92, 93, 101, 102], "swing": [92, 96], "free": [92, 96, 97, 98, 101, 102, 103, 104, 109, 116, 119], "height": [92, 100, 103, 108], "hang": 92, "downward": 92, "seen": [92, 99], "green": [92, 114], "cosin": [92, 103, 106], "theta1": 92, "sine": [92, 103, 106], "theta2": 92, "567": 92, "274": 92, "4\u03c0": 92, "9\u03c0": 92, "rad": [92, 93, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108], "incur": [92, 112, 114], "co": [92, 94, 95, 96, 103, 106, 109], "book_or_nip": 92, "neurip": 92, "paper": [92, 103, 114], "nip": 92, "equat": [92, 96], "confirm": 92, "radian": [92, 93, 96, 104], "1996": 92, "touretzki": 92, "mozer": 92, "hasselmo": 92, "ed": 92, "vol": [92, 114], "mit": [92, 116, 119], "proceed": 92, "cc": 92, "1995": 92, "8f1d43620bc6bb580df6e80b0dc05c48": 92, "pdf": [92, 111, 112], "anderson": [93, 103, 104], "neuronlik": [93, 103, 104], "adapt": [93, 103, 104, 112], "un": 93, "frictionless": 93, "balanc": [93, 103, 104, 119], "vari": [93, 103, 104, 119], "418": 93, "untermin": 93, "2095": 93, "allot": 93, "475": 93, "05": [93, 98, 99, 105], "07": [94, 95], "sinusoid": [94, 95], "vallei": [94, 95], "strateg": [94, 95], "hill": [94, 95], "andrew": [94, 95], "moor": [94, 95], "phd": [94, 95, 107], "thesi": [94, 95, 107], "1990": [94, 95], "techreport": [94, 95], "moore90efficientmemori": [94, 95], "author": [94, 95, 109, 116, 119], "william": [94, 95, 119], "institut": [94, 95], "univers": [94, 95], "cambridg": [94, 95], "year": [94, 95], "001": [94, 96, 100, 103, 108, 116], "0025": [94, 95], "collis": [94, 95], "inelast": [94, 95], "upon": [94, 95], "quickli": [94, 116], "penalis": [94, 95, 98, 99, 100, 101, 102, 103, 105, 106, 107, 108], "equal": [94, 95, 103, 111, 113], "0015": 95, "45": [95, 102, 105], "999": 95, "invert": [96, 97, 119], "swingup": 96, "diagram": 96, "meter": 96, "theta": 96, "tau": 96, "counter": 96, "clockwis": 96, "theta_dt": 96, "heta": 96, "2736044": 96, "calcul": [96, 97, 98, 101, 102, 103, 105, 106, 112, 113, 114], "math": 96, "half": 97, "cheetah": 97, "standup": 97, "facilit": [97, 109], "develop": [97, 119], "biomechan": 97, "graphic": [97, 109], "anim": 97, "area": 97, "accur": 97, "octob": 97, "2021": [97, 109], "deepmind": 97, "2022": 97, "everyon": 97, "instruct": [97, 117], "websit": [97, 109], "framework": 97, "ten": [97, 111, 116], "iverteddoublependulum": 97, "gaussian": 97, "mjsim": 97, "qpo": 97, "qvel": [97, 101, 102], "indirectli": 97, "xml": [97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108], "tweak": [97, 107], "schulman": 98, "moritz": 98, "levin": 98, "jordan": 98, "abbeel": 98, "advantag": [98, 109, 117], "estim": [98, 118, 119], "torso": [98, 99, 100, 101, 102, 108], "eight": 98, "hing": [98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108], "rotor": [98, 99, 100, 101, 102, 107, 108], "front": [98, 99, 107], "hip_1": [98, 101, 102], "front_left_leg": [98, 101, 102], "angle_1": [98, 101, 102], "hip_2": [98, 101, 102], "front_right_leg": [98, 101, 102], "angle_2": 98, "hip_3": 98, "back_leg": 98, "angle_3": 98, "hip_4": 98, "right_back_leg": 98, "angle_4": 98, "deriv": [98, 99, 100, 101, 102, 103, 104, 107, 108, 119], "exclude_current_positions_from_observ": [98, 99, 100, 101, 107, 108], "113": 98, "regardless": [98, 99, 100, 101, 107, 108], "x_posit": [98, 99, 100, 101, 107, 108], "y_posit": [98, 101, 107], "111": 98, "z": [98, 99, 100, 101, 102, 105, 106, 108], "centr": [98, 101, 102], "ankle_1": 98, "ankle_2": 98, "ankle_3": 98, "ankle_4": 98, "19": [98, 101, 102, 105], "23": [98, 101, 102, 105, 109], "translat": [98, 101, 102, 117], "dof": [98, 101, 102], "quaternion": [98, 101, 102], "healthy_reward": [98, 100, 101, 108], "healthi": [98, 100, 101, 108], "forward_reward": [98, 99, 100, 101, 107, 108], "dt": [98, 99, 100, 101, 105, 106, 107, 108], "frametim": [98, 99, 100, 101, 107, 108], "ctrl_cost": [98, 99, 100, 101, 107, 108], "too": [98, 99, 100, 101, 102, 103, 105, 106, 107, 108], "ctrl_cost_weight": [98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108], "ctr_cost_weight": 98, "contact_cost": [98, 101], "contact_cost_weight": [98, 101], "contact_force_rang": 98, "reset_noise_scal": [98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108], "deviat": [98, 99, 103, 107, 119], "intention": [98, 101, 102], "therebi": [98, 101, 102], "unhealthi": [98, 100, 101, 108], "healthy_z_rang": [98, 100, 101, 108], "terminate_when_unhealthi": [98, 100, 101, 108], "xml_file": [98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108], "path": [98, 99, 100, 101, 105, 106, 107, 108, 113], "model": [98, 99, 100, 101, 107, 108, 109, 116], "5e": [98, 100, 101, 108], "perturb": [98, 99, 100, 101, 107, 108], "induct": [98, 99, 100, 101, 107, 108], "bia": [98, 99, 100, 101, 107, 108], "induc": [98, 99, 100, 101, 107, 108], "agnost": [98, 99, 100, 101, 102, 107, 108], "bind": [98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108], "camera": [98, 99, 100, 101, 102, 103, 104, 107, 108], "mujoco_pi": [98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108], "max_time_step": [98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108], "p": [99, 109, 112, 113, 114], "wawrzy\u0144ski": 99, "cat": 99, "paw": 99, "alloc": 99, "thigh": [99, 100, 101, 102, 108], "shin": [99, 101, 102], "feet": [99, 108], "bthigh": 99, "bshin": 99, "bfoot": 99, "fthigh": 99, "fshin": 99, "ffoot": 99, "tip": [99, 103, 107], "rootz": [99, 100, 108], "slide": [99, 100, 103, 104, 105, 106, 107, 108], "rooti": [99, 100, 108], "rootx": [99, 100, 108], "forward_reward_weight": [99, 100, 101, 107, 108], "half_cheetah": 99, "erez": [100, 101, 102, 108], "tassa": [100, 101, 102, 108], "todorov": [100, 101, 102, 108], "predict": [100, 108, 119], "nonlinear": [100, 108], "compar": [100, 107, 108, 116], "figur": [100, 108, 116, 119], "middl": [100, 108], "thigh_joint": [100, 108], "leg_joint": [100, 108], "foot_joint": [100, 108], "002": [100, 108], "008": [100, 108], "els": [100, 108, 113, 116, 117], "healthy_state_rang": 100, "fallen": 100, "healthy_angle_rang": [100, 108], "376": [101, 102], "synthesi": [101, 102], "onlin": [101, 102, 109, 111, 112], "abdomen": [101, 102], "pair": [101, 102], "arm": [101, 102, 105, 106, 109], "elbow": [101, 102, 105], "walk": [101, 108, 110, 113, 117], "right_hip_x": [101, 102], "right_thigh": [101, 102], "right_hip_z": [101, 102], "right_hip_i": [101, 102], "right_kne": [101, 102], "left_hip_x": [101, 102], "left_thigh": [101, 102], "left_hip_z": [101, 102], "left_hip_i": [101, 102], "left_kne": [101, 102], "right_shoulder1": [101, 102], "right_shoulder2": [101, 102], "right_elbow": [101, 102], "left_shoulder1": [101, 102], "left_shoulder2": [101, 102], "left_elbow": [101, 102], "378": 101, "root": [101, 102], "lower_waist": [101, 102], "abdomen_z": [101, 102], "abdomen_i": [101, 102], "pelvi": [101, 102], "abdomen_x": [101, 102], "right_upper_arm": [101, 102], "right_lower_arm": [101, 102], "left_upper_arm": [101, 102], "left_lower_arm": [101, 102], "anglular": [101, 102, 104], "29": [101, 102], "aanglular": [101, 102], "33": [101, 102], "34": 101, "35": [101, 102], "37": [101, 102], "39": [101, 102], "41": [101, 102], "43": [101, 102], "velocitti": 101, "addition": [101, 102], "cinert": [101, 102], "inertia": [101, 102], "rigid": [101, 102], "intermedi": [101, 102], "nbodi": [101, 102], "henc": [101, 102, 110, 119], "140": [101, 102], "cvel": [101, 102], "qfrc_actuat": [101, 102], "constraint": [101, 102, 103, 109], "nv": [101, 102], "cfrc_ext": [101, 102], "dim": [101, 102], "003": 101, "015": 101, "nu": [101, 102], "contact_cost_rang": 101, "lai": 102, "state_spac": 102, "uph_cost": 102, "upward": 102, "absolut": [102, 104, 108], "overal": 102, "atom": 102, "movement": [102, 117], "though": 102, "inflat": 102, "quad_ctrl_cost": 102, "quad_impact_cost": 102, "000001": 102, "105": 102, "unlik": [102, 103, 104, 105, 106, 119], "beyond": [102, 103, 104, 105, 106, 108], "slider": [103, 104], "unitless": [103, 106], "hinge2": 103, "realist": [103, 109], "accuraci": 103, "approach": [103, 116, 117, 119], "analyt": 103, "alive_bonu": 103, "distance_penalti": 103, "velocity_penalti": 103, "005": [103, 105, 106], "y_coordin": 103, "196": 103, "perpendicularli": 103, "cylind": 105, "effector": [105, 106], "fingertip": [105, 106], "shoulder": 105, "forearm": 105, "wrist": 105, "pan": 105, "r_shoulder_pan_joint": 105, "lift": 105, "r_shoulder_lift_joint": 105, "r_upper_arm_roll_joint": 105, "flex": 105, "r_elbow_flex_joint": 105, "r_forearm_roll_joint": 105, "r_wrist_flex_joint": 105, "r_wrist_roll_joint": 105, "analogi": 105, "tips_arm": 105, "obj_slidex": 105, "obj_slidei": 105, "goal_slidex": 105, "goal_slidei": 105, "sphere": 105, "reward_near": 105, "unattach": [105, 106], "reward_control": [105, 106], "euclidean": [105, 106], "perman": 105, "323": 105, "rise": 105, "asset": [105, 106, 109, 113], "gymnasmium": 105, "fixtur": 106, "joint0": 106, "joint1": 106, "target_x": 106, "target_i": 106, "position_fingertip": 106, "position_target": 106, "na": 106, "disk": 106, "radiu": 106, "everyth": 106, "02": 106, "r\u00e9mi": 107, "coulom": 107, "applic": [107, 109], "segment": 107, "articul": [107, 109], "suspend": 107, "subject": 107, "fluid": 107, "viscou": 107, "coeffici": 107, "motor1_rot": 107, "motor2_rot": 107, "\u03b8": 107, "free_body_rot": 107, "slider1": 107, "slider2": 107, "04": 107, "swim": 107, "split": 108, "thigh_left_joint": 108, "leg_left_joint": 108, "foot_left_joint": 108, "ctr_cost": 108, "procedur": [109, 119], "clone": [109, 117], "huge": 109, "3v3": 109, "hundr": 109, "roughli": 109, "tweakabl": 109, "monei": 109, "slime": 109, "volleybal": 109, "motiv": 109, "premad": 109, "foss": 109, "interoper": 109, "extens": [109, 119], "light": 109, "poli": 109, "pinocchio": 109, "meshcat": 109, "web": 109, "bitcraz": 109, "crazyfli": 109, "nanoquadrotor": 109, "endeavor": 109, "gap": 109, "deep": [109, 118, 119], "methodologi": 109, "coverag": 109, "laboratori": 109, "internet": 109, "quadrotor": 109, "casadi": 109, "symbol": 109, "priori": 109, "isaac": 109, "omnivers": 109, "cours": 109, "wide": 109, "account": 109, "yield": 109, "voltag": 109, "duti": 109, "cycl": 109, "plan": 109, "emphasi": 109, "percept": 109, "social": 109, "driver": 109, "whose": [109, 111], "uncertain": 109, "merg": 109, "intersect": 109, "roundabout": 109, "latent": 109, "transfer": 109, "miniatur": 109, "racecar": 109, "llvm": 109, "phase": 109, "gcc": 109, "cuda": 109, "p_0": 109, "morl": 109, "cell": [109, 112, 117], "warehous": 109, "storag": 109, "overfit": 109, "predefin": [109, 117], "hyperparamet": [109, 116, 119], "cheap": 109, "surrog": 109, "evolutionari": 109, "tag": 109, "answer": 109, "classif": 109, "dataset": 109, "autom": 109, "prover": 109, "vampir": 109, "theoret": 109, "workshop": 109, "minatari": 109, "bsuit": 109, "great": [109, 116], "focu": 109, "simplic": 109, "comprehens": 109, "crypto": 109, "omg": 109, "toolbox": 109, "minimalist": 109, "synthes": 109, "neuro": 109, "architectur": 109, "integr": 109, "twin": 109, "concept": 109, "seamless": 109, "firmwar": 109, "neuroflight": 109, "frozen": 110, "lake": 110, "suitabl": 110, "card": [111, 116], "dealer": [111, 116], "deck": [111, 116], "jack": 111, "queen": 111, "king": 111, "ac": [111, 116], "usabl": [111, 116], "held": 111, "decid": 111, "bust": [111, 116], "reveal": 111, "facedown": 111, "goe": 111, "outcom": 111, "hand": [111, 119], "sab": [111, 116], "2020": [111, 112], "incompleteidea": [111, 112], "rlbook2020": [111, 112], "48": 112, "4x12": 112, "world": [112, 113, 114], "132": 112, "inspir": 112, "dennybritz": 112, "blob": 112, "cliff_walk": 112, "latter": 112, "current_row": [112, 113], "nrow": [112, 113], "current_col": [112, 113], "col": [112, 113], "47": 112, "proabil": [112, 114], "slipperi": 113, "extent": 113, "4x4": 113, "perpendicular": 113, "is_slipperi": 113, "stool": 113, "franuka": 113, "itch": 113, "io": 113, "rpg": 113, "snow": 113, "tileset": 113, "mel": 113, "tilleri": 113, "cyaneu": 113, "ncol": [113, 116], "time_limit": [113, 114], "8x8": 113, "desc": 113, "map_nam": 113, "preload": 113, "sfff": 113, "fhfh": 113, "fffh": 113, "hffg": 113, "generate_random_map": 113, "toy_text": [113, 116], "frozen_lak": 113, "sfffffff": 113, "ffffffff": 113, "fffhffff": 113, "fffffhff": 113, "fhhfffhf": 113, "fhffhfhf": 113, "fffhfffg": 113, "bug": 113, "passeng": 114, "yellow": 114, "5x5": 114, "maxq": 114, "decomposit": 114, "tom": 114, "dietterich": 114, "pickup": 114, "south": 114, "north": 114, "east": 114, "west": 114, "letter": 114, "taxi_row": 114, "taxi_col": 114, "passenger_loc": 114, "404": 114, "reachabl": 114, "illeg": 114, "action_mask": 114, "fickl": 114, "Or": 114, "argmax": [114, 116], "q_valu": [114, 116], "pp": 114, "227": 114, "303": 114, "nov": 114, "doi": 114, "1613": 114, "639": 114, "cleaner": 114, "disallow": 114, "loc": 114, "passidx": 114, "maintain": 115, "capabl": 115, "insert": [115, 119], "casino": 116, "infam": 116, "beatabl": 116, "won": 116, "viabl": 116, "strategi": 116, "favorit": 116, "zemann": 116, "__future__": [116, 119], "annot": [116, 119], "defaultdict": 116, "pyplot": [116, 119], "plt": [116, 119], "seaborn": [116, 119], "sn": [116, 119], "patch": 116, "tqdm": 116, "explanatori": 116, "tell": [116, 118], "idea": [116, 118], "slow": 116, "showcas": 116, "respond": 116, "harm": 116, "greedi": 116, "blackjackag": 116, "learning_r": [116, 119], "initial_epsilon": 116, "epsilon_decai": 116, "final_epsilon": 116, "discount_factor": 116, "95": 116, "arg": [116, 119], "decai": 116, "lr": [116, 119], "training_error": 116, "get_act": 116, "greedili": 116, "exploit": 116, "next_ob": [116, 119], "future_q_valu": 116, "temporal_differ": 116, "decay_epsilon": 116, "readi": 116, "n_episod": 116, "100_000": 116, "start_epsilon": 116, "decent": [116, 119], "converg": 116, "10x": 116, "rolling_length": 116, "fig": 116, "subplot": 116, "figsiz": [116, 119], "set_titl": 116, "reward_moving_averag": 116, "convolv": 116, "length_moving_averag": 116, "training_error_moving_averag": 116, "tight_layout": 116, "create_grid": 116, "usable_ac": 116, "state_valu": 116, "action_valu": 116, "player_count": 116, "dealer_count": 116, "meshgrid": 116, "arang": 116, "apply_along_axi": 116, "arr": 116, "dstack": 116, "value_grid": 116, "policy_grid": 116, "create_plot": 116, "figaspect": 116, "suptitl": 116, "fontsiz": 116, "ax1": 116, "add_subplot": 116, "plot_surfac": 116, "rstride": 116, "cstride": 116, "cmap": 116, "viridi": 116, "edgecolor": 116, "xtick": 116, "ytick": 116, "set_xlabel": 116, "set_ylabel": 116, "zaxi": 116, "set_rotate_label": 116, "set_zlabel": 116, "view_init": 116, "220": 116, "ax2": 116, "heatmap": 116, "linewidth": 116, "accent_r": 116, "cbar": 116, "set_xticklabel": 116, "set_yticklabel": 116, "legend": 116, "legend_el": 116, "facecolor": 116, "lightgreen": 116, "label": 116, "grei": 116, "bbox_to_anchor": 116, "fig1": 116, "fig2": 116, "hopefulli": 116, "grip": 116, "challeng": 116, "mont": [116, 119], "carlo": [116, 119], "fun": [116, 119], "blackjack_tutori": 116, "ipynb": [116, 117, 118, 119], "overview": [117, 119], "virtual": 117, "git": 117, "venv": 117, "bin": 117, "concern": [117, 119], "readm": 117, "setup": 117, "gym_exampl": 117, "grid_world": 117, "relative_posit": 117, "reacher_weighted_reward": 117, "discrete_act": 117, "clip_reward": 117, "illustr": [117, 118], "simplist": 117, "gridworldenv": 117, "piec": 117, "abstract": 117, "window_s": 117, "512": 117, "_action_to_direct": 117, "assert": 117, "clock": 117, "_get_ob": 117, "mandatori": 117, "_agent_loc": 117, "_target_loc": 117, "manhattan": 117, "_get_info": 117, "oftentim": 117, "worri": 117, "coincid": 117, "earlier": 117, "array_equ": 117, "_render_fram": 117, "trivial": 117, "skeleton": 117, "set_mod": 117, "canva": 117, "pix_square_s": 117, "rect": 117, "gridlin": 117, "width": 117, "visibl": 117, "blit": 117, "get_rect": 117, "pump": 117, "delai": 117, "stabl": 117, "tick": 117, "surfarrai": 117, "pixels3d": 117, "bother": 117, "detect": 117, "put": 117, "registr": 117, "appropri": [117, 119], "entrypoint": 117, "mere": 117, "third": 117, "parti": 117, "codebas": 117, "edit": 117, "setuptool": 117, "install_requir": 117, "local": 117, "perfectli": 117, "fine": 117, "did": 118, "failur": 118, "notabl": 118, "inher": 118, "preserv": 118, "obviou": 118, "forev": 118, "forcibli": 118, "halt": 118, "formal": 118, "q_": 118, "o_t": 118, "a_t": 118, "r_t": 118, "max_a": 118, "o_": 118, "a_": 118, "q_target": 118, "distinct": 118, "frequent": 118, "differenti": 118, "vf_target": 118, "vf_next_stat": 118, "onward": 118, "handling_time_limit": 118, "scratch": 119, "earliest": 119, "gradient": 119, "burden": 119, "maxim": 119, "inverted_pendulum": 119, "1d": 119, "panda": 119, "pd": 119, "nn": 119, "rcparam": 119, "parameter": 119, "policy_network": 119, "obs_space_dim": 119, "action_space_dim": 119, "hidden_space1": 119, "feel": 119, "hidden_space2": 119, "shared_net": 119, "sequenti": 119, "policy_mean_net": 119, "std": 119, "policy_stddev_net": 119, "tensor": 119, "action_mean": 119, "action_stddev": 119, "shared_featur": 119, "exp": 119, "mention": 119, "fact": 119, "reinfroc": 119, "acronym": 119, "ward": 119, "ncrement": 119, "actor": 119, "o": 119, "ffset": 119, "einforc": 119, "haracterist": 119, "ligibl": 119, "tune": 119, "ep": 119, "mathemat": 119, "prob": 119, "adamw": 119, "sample_act": 119, "distrib": 119, "log_prob": 119, "running_g": 119, "delta": 119, "zip": 119, "zero_grad": 119, "centric": 119, "reiniti": 119, "fairli": 119, "brittl": 119, "spinningup": 119, "en": 119, "html": 119, "total_num_episod": 119, "5e3": 119, "rewards_over_se": 119, "fibonacci": 119, "manual_se": 119, "reward_over_episod": 119, "avg_reward": 119, "rewards_to_plot": 119, "df1": 119, "datafram": 119, "melt": 119, "renam": 119, "inplac": 119, "darkgrid": 119, "talk": 119, "palett": 119, "rainbow": 119, "lineplot": 119, "siddarth": 119, "chandrasekar": 119, "ronald": 119, "connectionist": 119, "machin": 119, "2004": 119, "229": 119, "256": 119, "reinforce_invpend_gym_v26": 119}, "objects": {"Space": [[9, 0, 1, "", "dtype"]], "": [[15, 1, 1, "", "action_space"], [15, 1, 1, "", "observation_space"], [15, 1, 1, "", "single_action_space"], [15, 1, 1, "", "single_observation_space"]], "gymnasium": [[17, 2, 1, "", "ActionWrapper"], [2, 2, 1, "", "Env"], [19, 2, 1, "", "ObservationWrapper"], [20, 2, 1, "", "RewardWrapper"], [16, 2, 1, "", "Wrapper"], [8, 3, 1, "", "make"], [8, 3, 1, "", "pprint_registry"], [8, 3, 1, "", "register"], [8, 3, 1, "", "spec"]], "gymnasium.ActionWrapper.ActionWrapper": [[17, 3, 1, "", "action"]], "gymnasium.Env": [[2, 1, 1, "", "action_space"], [2, 3, 1, "", "close"], [2, 1, 1, "", "metadata"], [2, 0, 1, "", "np_random"], [2, 1, 1, "", "observation_space"], [2, 3, 1, "", "render"], [2, 1, 1, "", "render_mode"], [2, 3, 1, "", "reset"], [2, 1, 1, "", "reward_range"], [2, 1, 1, "", "spec"], [2, 3, 1, "", "step"], [2, 0, 1, "", "unwrapped"]], "gymnasium.ObservationWrapper": [[19, 3, 1, "", "observation"]], "gymnasium.RewardWrapper.RewardWrapper": [[20, 3, 1, "", "reward"]], "gymnasium.Wrapper": [[16, 0, 1, "", "action_space"], [16, 3, 1, "", "close"], [16, 0, 1, "", "metadata"], [16, 0, 1, "", "np_random"], [16, 0, 1, "", "observation_space"], [16, 3, 1, "", "reset"], [16, 0, 1, "", "reward_range"], [16, 0, 1, "", "spec"], [16, 3, 1, "", "step"], [16, 0, 1, "", "unwrapped"]], "gymnasium.experimental": [[4, 2, 1, "", "FuncEnv"]], "gymnasium.experimental.FuncEnv": [[4, 3, 1, "id0", "initial"], [4, 3, 1, "id1", "observation"], [4, 3, 1, "", "render_close"], [4, 3, 1, "", "render_image"], [4, 3, 1, "", "render_init"], [4, 3, 1, "", "reward"], [4, 3, 1, "", "state_info"], [4, 3, 1, "", "step_info"], [4, 3, 1, "", "terminal"], [4, 3, 1, "", "transform"], [4, 3, 1, "", "transition"]], "gymnasium.experimental.wrappers": [[7, 2, 1, "", "ClipRewardV0"], [7, 2, 1, "", "LambdaActionV0"], [7, 2, 1, "", "LambdaObservationV0"], [7, 2, 1, "", "LambdaRewardV0"]], "gymnasium.spaces": [[11, 2, 1, "", "Box"], [10, 2, 1, "", "Dict"], [11, 2, 1, "", "Discrete"], [10, 2, 1, "", "Graph"], [11, 2, 1, "", "MultiBinary"], [11, 2, 1, "", "MultiDiscrete"], [10, 2, 1, "", "Sequence"], [9, 2, 1, "", "Space"], [11, 2, 1, "", "Text"], [10, 2, 1, "", "Tuple"]], "gymnasium.spaces.Box": [[11, 4, 1, "", "is_bounded"], [11, 4, 1, "", "sample"], [11, 4, 1, "", "seed"]], "gymnasium.spaces.Dict": [[10, 4, 1, "", "sample"], [10, 4, 1, "", "seed"]], "gymnasium.spaces.Discrete": [[11, 4, 1, "", "sample"], [11, 4, 1, "", "seed"]], "gymnasium.spaces.Graph": [[10, 4, 1, "", "sample"], [10, 4, 1, "", "seed"]], "gymnasium.spaces.MultiBinary": [[11, 4, 1, "", "sample"], [11, 4, 1, "", "seed"]], "gymnasium.spaces.MultiDiscrete": [[11, 4, 1, "", "sample"], [11, 4, 1, "", "seed"]], "gymnasium.spaces.Sequence": [[10, 4, 1, "", "sample"], [10, 4, 1, "", "seed"]], "gymnasium.spaces.Text": [[11, 4, 1, "", "sample"], [11, 4, 1, "", "seed"]], "gymnasium.spaces.Tuple": [[10, 4, 1, "", "sample"], [10, 4, 1, "", "seed"]], "gymnasium.spaces.space.Space": [[9, 3, 1, "", "contains"], [9, 3, 1, "", "from_jsonable"], [9, 3, 1, "", "sample"], [9, 3, 1, "", "seed"], [9, 0, 1, "", "shape"], [9, 3, 1, "", "to_jsonable"]], "gymnasium.spaces.utils": [[12, 3, 1, "", "flatdim"], [12, 3, 1, "", "flatten"], [12, 3, 1, "", "flatten_space"], [12, 3, 1, "", "unflatten"]], "gymnasium.utils.env_checker": [[14, 3, 1, "", "check_env"]], "gymnasium.utils.play": [[14, 2, 1, "", "PlayPlot"], [14, 2, 1, "", "PlayableGame"], [14, 3, 1, "", "play"]], "gymnasium.utils.play.PlayPlot": [[14, 4, 1, "", "callback"]], "gymnasium.utils.play.PlayableGame": [[14, 4, 1, "", "process_event"]], "gymnasium.utils.save_video": [[14, 3, 1, "", "capped_cubic_video_schedule"], [14, 3, 1, "", "save_video"]], "gymnasium.utils.seeding": [[14, 3, 1, "", "np_random"]], "gymnasium.utils.step_api_compatibility": [[14, 3, 1, "", "convert_to_done_step_api"], [14, 3, 1, "", "convert_to_terminated_truncated_step_api"], [14, 3, 1, "", "step_api_compatibility"]], "gymnasium.vector": [[15, 2, 1, "", "AsyncVectorEnv"], [15, 2, 1, "", "SyncVectorEnv"], [15, 2, 1, "", "VectorEnv"], [15, 3, 1, "", "make"]], "gymnasium.vector.VectorEnv": [[15, 4, 1, "", "close"], [15, 4, 1, "", "reset"], [15, 4, 1, "", "step"]], "gymnasium.vector.utils": [[13, 3, 1, "", "batch_space"], [13, 3, 1, "", "concatenate"], [13, 3, 1, "", "create_empty_array"], [13, 3, 1, "", "create_shared_memory"], [13, 3, 1, "", "iterate"], [13, 3, 1, "", "read_from_shared_memory"], [13, 3, 1, "", "write_to_shared_memory"]], "gymnasium.wrappers": [[18, 2, 1, "", "AtariPreprocessing"], [18, 2, 1, "", "AutoResetWrapper"], [17, 2, 1, "", "ClipAction"], [18, 2, 1, "", "EnvCompatibility"], [19, 2, 1, "", "FilterObservation"], [19, 2, 1, "", "FlattenObservation"], [19, 2, 1, "", "FrameStack"], [19, 2, 1, "", "GrayScaleObservation"], [18, 2, 1, "", "HumanRendering"], [19, 2, 1, "", "NormalizeObservation"], [20, 2, 1, "", "NormalizeReward"], [18, 2, 1, "", "OrderEnforcing"], [18, 2, 1, "", "PassiveEnvChecker"], [19, 2, 1, "", "PixelObservationWrapper"], [18, 2, 1, "", "RecordEpisodeStatistics"], [18, 2, 1, "", "RecordVideo"], [18, 2, 1, "", "RenderCollection"], [17, 2, 1, "", "RescaleAction"], [19, 2, 1, "", "ResizeObservation"], [18, 2, 1, "", "StepAPICompatibility"], [19, 2, 1, "", "TimeAwareObservation"], [18, 2, 1, "", "TimeLimit"], [19, 2, 1, "", "TransformObservation"], [20, 2, 1, "", "TransformReward"], [18, 2, 1, "", "VectorListInfo"]]}, "objtypes": {"0": "py:property", "1": "py:attribute", "2": "py:class", "3": "py:function", "4": "py:method"}, "objnames": {"0": ["py", "property", "Python property"], "1": ["py", "attribute", "Python attribute"], "2": ["py", "class", "Python class"], "3": ["py", "function", "Python function"], "4": ["py", "method", "Python method"]}, "titleterms": {"404": 0, "page": [0, 1], "Not": 0, "found": 0, "The": 0, "request": 0, "could": 0, "gymnasium": [1, 2, 4, 5, 15, 16, 115, 117], "doc": 1, "instruct": 1, "modifi": [1, 21], "environ": [1, 2, 3, 4, 5, 6, 8, 14, 15, 18, 21, 22, 23, 109, 115, 116, 117], "edit": 1, "an": [1, 116, 119], "ad": 1, "new": [1, 14], "atari": [1, 18, 24, 43], "env": [1, 2, 15, 109, 117], "non": 1, "other": [1, 109], "step": [1, 14, 22, 23, 117], "build": [1, 116, 119], "document": 1, "write": 1, "tutori": 1, "method": [2, 9, 15, 16], "attribut": [2, 9, 15, 16], "addit": 2, "implement": [2, 16], "experiment": [3, 4, 5], "function": [3, 4], "wrapper": [3, 6, 7, 16, 17, 18, 19, 20, 117], "lambda": [3, 6, 7], "observ": [3, 6, 7, 19, 21, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 89, 90, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 112, 113, 114, 116, 117], "action": [3, 6, 7, 17, 21, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 89, 90, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 112, 113, 114, 116], "reward": [3, 6, 7, 20, 24, 27, 28, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 88, 89, 90, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 112, 113, 114], "common": [3, 6, 7, 24], "vector": [3, 5, 6, 9, 13, 15, 18], "onli": [3, 6], "funcenv": 4, "func2env": 4, "functionaljaxcompatibilityenv": 4, "vectorenv": [5, 15], "asyncvectorenv": 5, "syncvectorenv": 5, "custom": [5, 16, 117], "envpool": 5, "registri": 8, "make": [8, 15, 117], "regist": [8, 117], "all": 8, "spec": 8, "pretti": 8, "print": 8, "space": [9, 10, 11, 12, 13, 21, 24, 50, 51, 52, 53, 54, 88, 89, 90, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 112, 113, 114], "fundament": [9, 11], "composit": [9, 10], "util": [9, 12, 13, 14], "dict": 10, "tupl": 10, "sequenc": 10, "graph": 10, "box": [11, 38], "discret": [11, 109], "multibinari": 11, "multidiscret": 11, "text": [11, 110], "share": 13, "memori": 13, "visual": [14, 116], "save": 14, "render": [14, 18, 23, 117], "video": [14, 18, 84, 109], "old": 14, "api": [14, 22, 115], "compat": [14, 18, 22], "seed": [14, 23], "check": 14, "async": 15, "sync": 15, "clip": 17, "rescal": 17, "misc": 18, "preprocess": 18, "autoreset": 18, "passiv": 18, "checker": 18, "human": 18, "order": 18, "enforc": 18, "record": 18, "episod": [18, 88, 89, 90, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 112, 113, 114], "statist": 18, "collect": [18, 115], "time": [18, 19, 118], "limit": [18, 118], "list": [18, 43], "info": 18, "transform": [19, 20], "filter": 19, "flatten": 19, "framestack": 19, "grai": 19, "scale": 19, "normal": [19, 20], "pixel": 19, "resiz": 19, "awar": 19, "basic": 21, "usag": 21, "initi": [21, 117], "interact": 21, "explain": 21, "code": [21, 23, 118], "more": 21, "inform": [21, 111, 112, 113, 114], "gym": [22, 109], "load": 22, "openai": [22, 109], "v0": 22, "22": 22, "v21": 23, "v26": 23, "migrat": 23, "guid": 23, "exampl": 23, "random": 23, "number": 23, "gener": 23, "reset": [23, 89, 117], "remov": 23, "autorom": 24, "instal": 24, "rom": 24, "stochast": 24, "argument": [24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 89, 90, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 112, 113, 114], "version": [24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 89, 90, 92, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 111, 112, 113, 114], "histori": [24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 89, 90, 92, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 112, 113, 114], "name": [24, 64], "scheme": 24, "flavor": 24, "refer": [24, 89, 92, 111, 112, 114, 115, 119], "adventur": 25, "descript": [25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 89, 90, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 112, 113, 114], "air": 26, "raid": 26, "alien": 27, "amidar": 28, "assault": 29, "asterix": 30, "asteroid": 31, "atlanti": 32, "bank": 33, "heist": 33, "battl": 34, "zone": 34, "beam": 35, "rider": 35, "berzerk": 36, "bowl": 37, "breakout": 39, "carniv": 40, "centiped": 41, "chopper": 42, "command": 42, "complet": 43, "crazi": 44, "climber": 44, "defend": 45, "demon": 46, "attack": 46, "doubl": [47, 103], "dunk": 47, "elev": 48, "enduro": 49, "fishingderbi": 50, "freewai": 51, "frostbit": 52, "gopher": 53, "gravitar": 54, "hero": 55, "icehockei": 56, "jamesbond": 57, "journeyescap": 58, "kangaroo": 59, "krull": 60, "kung": 61, "fu": 61, "master": 61, "montezuma": 62, "reveng": 62, "m": 63, "pacman": 63, "thi": 64, "game": [64, 109], "phoenix": 65, "pitfal": 66, "pong": 67, "pooyan": 68, "privateey": 69, "qbert": 70, "riverraid": 71, "road": 72, "runner": 72, "robot": [73, 109], "tank": 73, "seaquest": 74, "ski": 75, "solari": 76, "spaceinvad": 77, "stargunn": 78, "tenni": 79, "timepilot": 80, "tutankham": 81, "up": 82, "n": 82, "down": 82, "ventur": 83, "pinbal": 84, "wizard": 85, "wor": 85, "zaxxon": 86, "box2d": 87, "biped": 88, "walker": 88, "start": [88, 89, 90, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 112, 113, 114], "state": [88, 89, 90, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 112, 113, 114, 117], "termin": [88, 89, 90, 118], "credit": [88, 89, 90], "car": [89, 94, 95], "race": [89, 109], "lunar": 90, "lander": 90, "classic": [91, 109], "control": [91, 109], "acrobot": 92, "end": [92, 93, 94, 95, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 112, 113, 114], "cart": 93, "pole": 93, "mountain": [94, 95], "transit": [94, 95], "dynam": [94, 95, 109], "continu": 95, "pendulum": [96, 103, 104], "truncat": [96, 118], "mujoco": [97, 119], "ant": 98, "half": 99, "cheetah": 99, "hopper": 100, "humanoid": [101, 102], "standup": 102, "invert": [103, 104], "pusher": 105, "reacher": 106, "swimmer": 107, "note": 107, "walker2d": 108, "third": 109, "parti": 109, "stabl": 109, "retro": 109, "maintain": 109, "flappi": 109, "bird": 109, "A": 109, "derk": 109, "gpu": 109, "acceler": 109, "moba": 109, "slimevolleygym": 109, "simpl": 109, "singl": 109, "multi": 109, "agent": [109, 116, 119], "reinforc": [109, 115, 119], "learn": [109, 115, 116, 118, 119], "uniti": 109, "ml": 109, "engin": 109, "pge": 109, "parallel": 109, "jimini": 109, "train": [109, 116, 119], "pybullet": 109, "drone": 109, "quadcopt": 109, "marsexplor": 109, "mar": 109, "panda": 109, "us": [109, 117, 119], "physic": 109, "robo": 109, "real": 109, "world": 109, "simul": 109, "offworld": 109, "safe": 109, "softrobot": 109, "soft": 109, "igibson": 109, "dexteroushand": 109, "dual": 109, "dexter": 109, "hand": 109, "manipul": 109, "task": 109, "omniisaacgymenv": 109, "autonom": 109, "drive": 109, "sumo": 109, "rl": 109, "duckietown": 109, "electr": 109, "motor": 109, "highwai": 109, "commonroad": 109, "tmrl": 109, "trackmania": 109, "2020": 109, "through": 109, "racing_dream": 109, "l2r": 109, "multimod": 109, "where": 109, "how": 109, "racecar_gym": 109, "compilergym": 109, "optimis": 109, "compil": 109, "carl": 109, "context": 109, "adapt": 109, "matrix": 109, "mdp": 109, "easili": 109, "creat": [109, 117], "mo": 109, "object": 109, "cellular": 109, "automata": 109, "sokoban": 109, "2d": 109, "transport": 109, "puzzl": 109, "dacbench": 109, "benchmark": 109, "librari": 109, "algorithm": 109, "configur": 109, "nlpgym": 109, "toolkit": 109, "develop": 109, "solv": [109, 116], "nlp": 109, "satur": 109, "prove": 109, "theorem": 109, "shinrl": 109, "evalu": 109, "gymnax": 109, "hardwar": 109, "anytrad": 109, "financi": 109, "trade": 109, "forex": 109, "stock": 109, "mtsim": 109, "metatrad": 109, "5": 109, "platform": 109, "openmodelica": 109, "microgrid": 109, "power": 109, "electron": 109, "convert": 109, "mobil": 109, "coordin": 109, "wireless": 109, "network": [109, 119], "gymfc": 109, "flight": 109, "tune": 109, "framework": 109, "toi": 110, "blackjack": [111, 116], "cliff": 112, "walk": 112, "frozen": 113, "lake": 113, "taxi": 114, "i": 115, "standard": 115, "divers": 115, "q": 116, "import": [116, 118], "setup": 116, "execut": 116, "visualis": 116, "polici": [116, 119], "think": 116, "you": 116, "can": 116, "do": 116, "better": 116, "your": 117, "own": 117, "subclass": 117, "declar": 117, "construct": 117, "from": 117, "close": 117, "packag": 117, "instanc": 117, "handl": 118, "solut": 118, "plot": 119, "curv": 119}, "envversion": {"sphinx.domains.c": 2, "sphinx.domains.changeset": 1, "sphinx.domains.citation": 1, "sphinx.domains.cpp": 8, "sphinx.domains.index": 1, "sphinx.domains.javascript": 2, "sphinx.domains.math": 2, "sphinx.domains.python": 3, "sphinx.domains.rst": 2, "sphinx.domains.std": 2, "sphinx": 57}, "alltitles": {"404 - Page Not Found": [[0, "page-not-found"]], "The requested page could not be found.": [[0, "the-requested-page-could-not-be-found"]], "Gymnasium-docs": [[1, "gymnasium-docs"]], "Instructions for modifying environment pages": [[1, "instructions-for-modifying-environment-pages"]], "Editing an environment page": [[1, "editing-an-environment-page"]], "Adding a new environment": [[1, "adding-a-new-environment"]], "Atari env": [[1, "atari-env"]], "Non-Atari env": [[1, "non-atari-env"]], "Other steps": [[1, "other-steps"]], "Build the Documentation": [[1, "build-the-documentation"]], "Writing Tutorials": [[1, "writing-tutorials"]], "Env": [[2, "env"]], "gymnasium.Env": [[2, "gymnasium-env"]], "Methods": [[2, "methods"], [9, "methods"], [15, "methods"], [16, "methods"]], "Attributes": [[2, "attributes"], [9, "attributes"], [15, "attributes"], [16, "attributes"]], "Additional Methods": [[2, "additional-methods"]], "Implementing environments": [[2, "implementing-environments"]], "Experimental": [[3, "experimental"]], "Functional Environments": [[3, "functional-environments"]], "Wrappers": [[3, "wrappers"], [7, "wrappers"], [16, "wrappers"]], "Lambda Observation Wrappers": [[3, "lambda-observation-wrappers"], [7, "lambda-observation-wrappers"]], "Lambda Action Wrappers": [[3, "lambda-action-wrappers"], [7, "lambda-action-wrappers"]], "Lambda Reward Wrappers": [[3, "lambda-reward-wrappers"], [7, "lambda-reward-wrappers"]], "Common Wrappers": [[3, "common-wrappers"], [7, "common-wrappers"]], "Vector Only Wrappers": [[3, "vector-only-wrappers"], [6, "vector-only-wrappers"]], "Vector Environment": [[3, "vector-environment"]], "Wrappers for Vector Environments": [[3, "wrappers-for-vector-environments"]], "Functional Environment": [[4, "functional-environment"]], "gymnasium.experimental.FuncEnv": [[4, "gymnasium-experimental-funcenv"]], "gymnasium.experimental.func2env.FunctionalJaxCompatibilityEnv": [[4, "gymnasium-experimental-func2env-functionaljaxcompatibilityenv"]], "Vectorizing Environment": [[5, "vectorizing-environment"]], "gymnasium.experimental.VectorEnv": [[5, "gymnasium-experimental-vectorenv"]], "gymnasium.experimental.vector.AsyncVectorEnv": [[5, "gymnasium-experimental-vector-asyncvectorenv"]], "gymnasium.experimental.vector.SyncVectorEnv": [[5, "gymnasium-experimental-vector-syncvectorenv"]], "Custom Vector environments": [[5, "custom-vector-environments"]], "EnvPool": [[5, "envpool"]], "Vector Environment Wrappers": [[6, "vector-environment-wrappers"]], "Vector Lambda Observation Wrappers": [[6, "vector-lambda-observation-wrappers"]], "Vector Lambda Action Wrappers": [[6, "vector-lambda-action-wrappers"]], "Vector Lambda Reward Wrappers": [[6, "vector-lambda-reward-wrappers"]], "Vector Common Wrappers": [[6, "vector-common-wrappers"]], "Registry": [[8, "registry"]], "Make": [[8, "make"]], "Register": [[8, "register"]], "All registered environments": [[8, "all-registered-environments"]], "Spec": [[8, "spec"]], "Pretty print registry": [[8, "pretty-print-registry"]], "Spaces": [[9, "spaces"]], "Fundamental Spaces": [[9, "fundamental-spaces"], [11, "fundamental-spaces"]], "Composite Spaces": [[9, "composite-spaces"], [10, "composite-spaces"]], "Utils": [[9, "utils"], [14, "utils"]], "Vector Utils": [[9, "vector-utils"]], "Dict": [[10, "dict"]], "Tuple": [[10, "tuple"]], "Sequence": [[10, "sequence"]], "Graph": [[10, "graph"]], "Box": [[11, "box"]], "Discrete": [[11, "discrete"]], "MultiBinary": [[11, "multibinary"]], "MultiDiscrete": [[11, "multidiscrete"]], "Text": [[11, "text"]], "Spaces Utils": [[12, "spaces-utils"]], "Spaces Vector Utils": [[13, "spaces-vector-utils"]], "Shared Memory Utils": [[13, "shared-memory-utils"]], "Visualization": [[14, "visualization"]], "Save Rendering Videos": [[14, "save-rendering-videos"]], "Old to New Step API Compatibility": [[14, "old-to-new-step-api-compatibility"]], "Seeding": [[14, "seeding"]], "Environment Checking": [[14, "environment-checking"]], "Vector": [[15, "vector"]], "Gymnasium.vector.VectorEnv": [[15, "gymnasium-vector-vectorenv"]], "Making Vector Environments": [[15, "making-vector-environments"]], "Async Vector Env": [[15, "async-vector-env"]], "Sync Vector Env": [[15, "sync-vector-env"]], "gymnasium.Wrapper": [[16, "gymnasium-wrapper"]], "Gymnasium Wrappers": [[16, "gymnasium-wrappers"]], "Implementing a custom wrapper": [[16, "implementing-a-custom-wrapper"]], "Action Wrappers": [[17, "action-wrappers"]], "Action Wrapper": [[17, "action-wrapper"]], "Clip Action": [[17, "clip-action"]], "Rescale Action": [[17, "rescale-action"]], "Misc Wrappers": [[18, "misc-wrappers"]], "Atari Preprocessing": [[18, "atari-preprocessing"]], "Autoreset": [[18, "autoreset"]], "Compatibility": [[18, "compatibility"]], "Passive Environment Checker": [[18, "passive-environment-checker"]], "Human Rendering": [[18, "human-rendering"]], "Order Enforcing": [[18, "order-enforcing"]], "Record Episode Statistics": [[18, "record-episode-statistics"]], "Record Video": [[18, "record-video"]], "Render Collection": [[18, "render-collection"]], "Time Limit": [[18, "time-limit"]], "Vector List Info": [[18, "vector-list-info"]], "Observation Wrappers": [[19, "observation-wrappers"]], "Observation Wrapper": [[19, "observation-wrapper"]], "Transform Observation": [[19, "transform-observation"]], "Filter Observation": [[19, "filter-observation"]], "Flatten Observation": [[19, "flatten-observation"]], "Framestack Observations": [[19, "framestack-observations"]], "Gray Scale Observation": [[19, "gray-scale-observation"]], "Normalize Observation": [[19, "normalize-observation"]], "Pixel Observation Wrapper": [[19, "pixel-observation-wrapper"]], "Resize Observation": [[19, "resize-observation"]], "Time Aware Observation": [[19, "time-aware-observation"]], "Reward Wrappers": [[20, "reward-wrappers"]], "Reward Wrapper": [[20, "reward-wrapper"]], "Transform Reward": [[20, "transform-reward"]], "Normalize Reward": [[20, "normalize-reward"]], "Basic Usage": [[21, "basic-usage"]], "Initializing Environments": [[21, "initializing-environments"]], "Interacting with the Environment": [[21, "interacting-with-the-environment"]], "Explaining the code": [[21, "explaining-the-code"]], "Action and observation spaces": [[21, "action-and-observation-spaces"]], "Modifying the environment": [[21, "modifying-the-environment"]], "More information": [[21, "more-information"]], "Compatibility with Gym": [[22, "compatibility-with-gym"]], "Loading OpenAI Gym environments": [[22, "loading-openai-gym-environments"]], "Gym v0.22 Environment Compatibility": [[22, "gym-v0-22-environment-compatibility"]], "Step API Compatibility": [[22, "step-api-compatibility"]], "v21 to v26 Migration Guide": [[23, "v21-to-v26-migration-guide"]], "Example code for v21": [[23, "example-code-for-v21"]], "Example code for v26": [[23, "example-code-for-v26"]], "Seed and random number generator": [[23, "seed-and-random-number-generator"]], "Environment Reset": [[23, "environment-reset"]], "Environment Step": [[23, "environment-step"]], "Environment Render": [[23, "environment-render"]], "Removed code": [[23, "removed-code"]], "Atari": [[24, "atari"]], "AutoROM (installing the ROMs)": [[24, "autorom-installing-the-roms"]], "Action Space": [[24, "action-space"], [50, "action-space"], [51, "action-space"], [52, "action-space"], [53, "action-space"], [54, "action-space"], [88, "action-space"], [89, "action-space"], [90, "action-space"], [92, "action-space"], [93, "action-space"], [94, "action-space"], [95, "action-space"], [96, "action-space"], [98, "action-space"], [99, "action-space"], [100, "action-space"], [101, "action-space"], [102, "action-space"], [103, "action-space"], [104, "action-space"], [105, "action-space"], [106, "action-space"], [107, "action-space"], [108, "action-space"], [111, "action-space"], [112, "action-space"], [113, "action-space"], [114, "action-space"]], "Observation Space": [[24, "observation-space"], [88, "observation-space"], [89, "observation-space"], [90, "observation-space"], [92, "observation-space"], [93, "observation-space"], [94, "observation-space"], [95, "observation-space"], [96, "observation-space"], [98, "observation-space"], [99, "observation-space"], [100, "observation-space"], [101, "observation-space"], [102, "observation-space"], [103, "observation-space"], [104, "observation-space"], [105, "observation-space"], [106, "observation-space"], [107, "observation-space"], [108, "observation-space"], [111, "observation-space"], [112, "observation-space"], [113, "observation-space"], [114, "observation-space"]], "Rewards": [[24, "rewards"], [27, "rewards"], [28, "rewards"], [30, "rewards"], [31, "rewards"], [32, "rewards"], [33, "rewards"], [34, "rewards"], [35, "rewards"], [36, "rewards"], [37, "rewards"], [38, "rewards"], [39, "rewards"], [40, "rewards"], [41, "rewards"], [42, "rewards"], [44, "rewards"], [45, "rewards"], [46, "rewards"], [47, "rewards"], [48, "rewards"], [49, "rewards"], [50, "rewards"], [51, "rewards"], [52, "rewards"], [53, "rewards"], [54, "rewards"], [55, "rewards"], [56, "rewards"], [57, "rewards"], [58, "rewards"], [59, "rewards"], [60, "rewards"], [66, "rewards"], [67, "rewards"], [68, "rewards"], [69, "rewards"], [70, "rewards"], [71, "rewards"], [72, "rewards"], [73, "rewards"], [74, "rewards"], [75, "rewards"], [76, "rewards"], [77, "rewards"], [78, "rewards"], [79, "rewards"], [80, "rewards"], [88, "rewards"], [89, "rewards"], [90, "rewards"], [92, "rewards"], [93, "rewards"], [96, "rewards"], [98, "rewards"], [99, "rewards"], [100, "rewards"], [101, "rewards"], [102, "rewards"], [103, "rewards"], [104, "rewards"], [105, "rewards"], [106, "rewards"], [107, "rewards"], [108, "rewards"], [111, "rewards"], [113, "rewards"], [114, "rewards"]], "Stochasticity": [[24, "stochasticity"]], "Common Arguments": [[24, "common-arguments"]], "Version History and Naming Schemes": [[24, "version-history-and-naming-schemes"]], "Flavors": [[24, "flavors"]], "References": [[24, "references"], [89, "references"], [92, "references"], [111, "references"], [112, "references"], [114, "references"], [119, "references"]], "Adventure": [[25, "adventure"]], "Description": [[25, "description"], [26, "description"], [27, "description"], [28, "description"], [29, "description"], [30, "description"], [31, "description"], [32, "description"], [33, "description"], [34, "description"], [35, "description"], [36, "description"], [37, "description"], [38, "description"], [39, "description"], [40, "description"], [41, "description"], [42, "description"], [44, "description"], [45, "description"], [46, "description"], [47, "description"], [48, "description"], [49, "description"], [50, "description"], [51, "description"], [52, "description"], [53, "description"], [54, "description"], [55, "description"], [56, "description"], [57, "description"], [58, "description"], [59, "description"], [60, "description"], [61, "description"], [62, "description"], [63, "description"], [64, "description"], [65, "description"], [66, "description"], [67, "description"], [68, "description"], [69, "description"], [70, "description"], [71, "description"], [72, "description"], [73, "description"], [74, "description"], [75, "description"], [76, "description"], [77, "description"], [78, "description"], [79, "description"], [80, "description"], [81, "description"], [82, "description"], [83, "description"], [84, "description"], [85, "description"], [86, "description"], [88, "description"], [89, "description"], [90, "description"], [92, "description"], [93, "description"], [94, "description"], [95, "description"], [96, "description"], [98, "description"], [99, "description"], [100, "description"], [101, "description"], [102, "description"], [103, "description"], [104, "description"], [105, "description"], [106, "description"], [107, "description"], [108, "description"], [111, "description"], [112, "description"], [113, "description"], [114, "description"]], "Actions": [[25, "actions"], [26, "actions"], [27, "actions"], [28, "actions"], [29, "actions"], [30, "actions"], [31, "actions"], [32, "actions"], [33, "actions"], [34, "actions"], [35, "actions"], [36, "actions"], [37, "actions"], [38, "actions"], [39, "actions"], [40, "actions"], [41, "actions"], [42, "actions"], [44, "actions"], [45, "actions"], [46, "actions"], [47, "actions"], [48, "actions"], [49, "actions"], [55, "actions"], [56, "actions"], [57, "actions"], [58, "actions"], [59, "actions"], [60, "actions"], [61, "actions"], [62, "actions"], [63, "actions"], [64, "actions"], [65, "actions"], [66, "actions"], [67, "actions"], [68, "actions"], [69, "actions"], [70, "actions"], [71, "actions"], [72, "actions"], [73, "actions"], [74, "actions"], [75, "actions"], [76, "actions"], [77, "actions"], [78, "actions"], [79, "actions"], [80, "actions"], [81, "actions"], [82, "actions"], [83, "actions"], [84, "actions"], [85, "actions"], [86, "actions"]], "Observations": [[25, "observations"], [26, "observations"], [27, "observations"], [28, "observations"], [29, "observations"], [30, "observations"], [31, "observations"], [32, "observations"], [33, "observations"], [34, "observations"], [35, "observations"], [36, "observations"], [37, "observations"], [38, "observations"], [39, "observations"], [40, "observations"], [41, "observations"], [42, "observations"], [44, "observations"], [45, "observations"], [46, "observations"], [47, "observations"], [48, "observations"], [49, "observations"], [50, "observations"], [51, "observations"], [52, "observations"], [53, "observations"], [54, "observations"], [55, "observations"], [56, "observations"], [57, "observations"], [58, "observations"], [59, "observations"], [60, "observations"], [61, "observations"], [62, "observations"], [63, "observations"], [64, "observations"], [65, "observations"], [66, "observations"], [67, "observations"], [68, "observations"], [69, "observations"], [70, "observations"], [71, "observations"], [72, "observations"], [73, "observations"], [74, "observations"], [75, "observations"], [76, "observations"], [77, "observations"], [78, "observations"], [79, "observations"], [80, "observations"], [81, "observations"], [82, "observations"], [83, "observations"], [84, "observations"], [85, "observations"], [86, "observations"]], "Arguments": [[25, "arguments"], [26, "arguments"], [27, "arguments"], [28, "arguments"], [29, "arguments"], [30, "arguments"], [31, "arguments"], [32, "arguments"], [33, "arguments"], [34, "arguments"], [35, "arguments"], [36, "arguments"], [37, "arguments"], [38, "arguments"], [39, "arguments"], [40, "arguments"], [41, "arguments"], [42, "arguments"], [44, "arguments"], [45, "arguments"], [46, "arguments"], [47, "arguments"], [48, "arguments"], [49, "arguments"], [50, "arguments"], [51, "arguments"], [52, "arguments"], [53, "arguments"], [54, "arguments"], [55, "arguments"], [56, "arguments"], [57, "arguments"], [58, "arguments"], [59, "arguments"], [60, "arguments"], [61, "arguments"], [62, "arguments"], [63, "arguments"], [64, "arguments"], [65, "arguments"], [66, "arguments"], [67, "arguments"], [68, "arguments"], [69, "arguments"], [70, "arguments"], [71, "arguments"], [72, "arguments"], [73, "arguments"], [74, "arguments"], [75, "arguments"], [76, "arguments"], [77, "arguments"], [78, "arguments"], [79, "arguments"], [80, "arguments"], [81, "arguments"], [82, "arguments"], [83, "arguments"], [84, "arguments"], [85, "arguments"], [86, "arguments"], [88, "arguments"], [89, "arguments"], [90, "arguments"], [92, "arguments"], [93, "arguments"], [94, "arguments"], [95, "arguments"], [96, "arguments"], [98, "arguments"], [99, "arguments"], [100, "arguments"], [101, "arguments"], [102, "arguments"], [103, "arguments"], [104, "arguments"], [105, "arguments"], [106, "arguments"], [107, "arguments"], [108, "arguments"], [111, "arguments"], [112, "arguments"], [113, "arguments"], [114, "arguments"]], "Version History": [[25, "version-history"], [26, "version-history"], [27, "version-history"], [28, "version-history"], [29, "version-history"], [30, "version-history"], [31, "version-history"], [32, "version-history"], [33, "version-history"], [34, "version-history"], [35, "version-history"], [36, "version-history"], [37, "version-history"], [38, "version-history"], [39, "version-history"], [40, "version-history"], [41, "version-history"], [42, "version-history"], [44, "version-history"], [45, "version-history"], [46, "version-history"], [47, "version-history"], [48, "version-history"], [49, "version-history"], [50, "version-history"], [51, "version-history"], [52, "version-history"], [53, "version-history"], [54, "version-history"], [55, "version-history"], [56, "version-history"], [57, "version-history"], [58, "version-history"], [59, "version-history"], [60, "version-history"], [61, "version-history"], [62, "version-history"], [63, "version-history"], [64, "version-history"], [65, "version-history"], [66, "version-history"], [67, "version-history"], [68, "version-history"], [69, "version-history"], [70, "version-history"], [71, "version-history"], [72, "version-history"], [73, "version-history"], [74, "version-history"], [75, "version-history"], [76, "version-history"], [77, "version-history"], [78, "version-history"], [79, "version-history"], [80, "version-history"], [81, "version-history"], [82, "version-history"], [83, "version-history"], [84, "version-history"], [85, "version-history"], [86, "version-history"], [88, "version-history"], [89, "version-history"], [90, "version-history"], [92, "version-history"], [94, "version-history"], [95, "version-history"], [96, "version-history"], [98, "version-history"], [99, "version-history"], [100, "version-history"], [101, "version-history"], [102, "version-history"], [103, "version-history"], [104, "version-history"], [105, "version-history"], [106, "version-history"], [107, "version-history"], [108, "version-history"], [111, "version-history"], [112, "version-history"], [113, "version-history"], [114, "version-history"]], "Air Raid": [[26, "air-raid"]], "Alien": [[27, "alien"]], "Amidar": [[28, "amidar"]], "Assault": [[29, "assault"]], "Asterix": [[30, "asterix"]], "Asteroids": [[31, "asteroids"]], "Atlantis": [[32, "atlantis"]], "Bank Heist": [[33, "bank-heist"]], "Battle Zone": [[34, "battle-zone"]], "Beam Rider": [[35, "beam-rider"]], "Berzerk": [[36, "berzerk"]], "Bowling": [[37, "bowling"]], "Boxing": [[38, "boxing"]], "Breakout": [[39, "breakout"]], "Carnival": [[40, "carnival"]], "Centipede": [[41, "centipede"]], "Chopper Command": [[42, "chopper-command"]], "Complete List - Atari": [[43, "complete-list-atari"]], "Crazy Climber": [[44, "crazy-climber"]], "Defender": [[45, "defender"]], "Demon Attack": [[46, "demon-attack"]], "Double Dunk": [[47, "double-dunk"]], "Elevator Action": [[48, "elevator-action"]], "Enduro": [[49, "enduro"]], "FishingDerby": [[50, "fishingderby"]], "Freeway": [[51, "freeway"]], "Frostbite": [[52, "frostbite"]], "Gopher": [[53, "gopher"]], "Gravitar": [[54, "gravitar"]], "Hero": [[55, "hero"]], "IceHockey": [[56, "icehockey"]], "Jamesbond": [[57, "jamesbond"]], "JourneyEscape": [[58, "journeyescape"]], "Kangaroo": [[59, "kangaroo"]], "Krull": [[60, "krull"]], "Kung Fu Master": [[61, "kung-fu-master"]], "Montezuma Revenge": [[62, "montezuma-revenge"]], "Ms Pacman": [[63, "ms-pacman"]], "Name This Game": [[64, "name-this-game"]], "Phoenix": [[65, "phoenix"]], "Pitfall": [[66, "pitfall"]], "Pong": [[67, "pong"]], "Pooyan": [[68, "pooyan"]], "PrivateEye": [[69, "privateeye"]], "Qbert": [[70, "qbert"]], "Riverraid": [[71, "riverraid"]], "Road Runner": [[72, "road-runner"]], "Robot Tank": [[73, "robot-tank"]], "Seaquest": [[74, "seaquest"]], "Skiings": [[75, "skiings"]], "Solaris": [[76, "solaris"]], "SpaceInvaders": [[77, "spaceinvaders"]], "StarGunner": [[78, "stargunner"]], "Tennis": [[79, "tennis"]], "TimePilot": [[80, "timepilot"]], "Tutankham": [[81, "tutankham"]], "Up n\u2019 Down": [[82, "up-n-down"]], "Venture": [[83, "venture"]], "Video Pinball": [[84, "video-pinball"]], "Wizard of Wor": [[85, "wizard-of-wor"]], "Zaxxon": [[86, "zaxxon"]], "Box2D": [[87, "box2d"]], "Bipedal Walker": [[88, "bipedal-walker"]], "Starting State": [[88, "starting-state"], [89, "starting-state"], [90, "starting-state"], [92, "starting-state"], [93, "starting-state"], [94, "starting-state"], [95, "starting-state"], [96, "starting-state"], [98, "starting-state"], [99, "starting-state"], [100, "starting-state"], [101, "starting-state"], [102, "starting-state"], [103, "starting-state"], [104, "starting-state"], [105, "starting-state"], [106, "starting-state"], [107, "starting-state"], [108, "starting-state"], [111, "starting-state"], [112, "starting-state"], [113, "starting-state"], [114, "starting-state"]], "Episode Termination": [[88, "episode-termination"], [89, "episode-termination"], [90, "episode-termination"]], "Credits": [[88, "credits"], [89, "credits"], [90, "credits"]], "Car Racing": [[89, "car-racing"]], "Reset Arguments": [[89, "reset-arguments"]], "Lunar Lander": [[90, "lunar-lander"]], "Classic Control": [[91, "classic-control"]], "Acrobot": [[92, "acrobot"]], "Episode End": [[92, "episode-end"], [93, "episode-end"], [94, "episode-end"], [95, "episode-end"], [98, "episode-end"], [99, "episode-end"], [100, "episode-end"], [101, "episode-end"], [102, "episode-end"], [103, "episode-end"], [104, "episode-end"], [105, "episode-end"], [106, "episode-end"], [107, "episode-end"], [108, "episode-end"], [111, "episode-end"], [112, "episode-end"], [113, "episode-end"], [114, "episode-end"]], "Cart Pole": [[93, "cart-pole"]], "Mountain Car": [[94, "mountain-car"]], "Transition Dynamics:": [[94, "transition-dynamics"], [95, "transition-dynamics"]], "Reward:": [[94, "reward"]], "Mountain Car Continuous": [[95, "mountain-car-continuous"]], "Reward": [[95, "reward"], [112, "reward"]], "Pendulum": [[96, "pendulum"]], "Episode Truncation": [[96, "episode-truncation"]], "MuJoCo": [[97, "mujoco"]], "Ant": [[98, "ant"]], "Half Cheetah": [[99, "half-cheetah"]], "Hopper": [[100, "hopper"]], "Humanoid": [[101, "humanoid"]], "Humanoid Standup": [[102, "humanoid-standup"]], "Inverted Double Pendulum": [[103, "inverted-double-pendulum"]], "Inverted Pendulum": [[104, "inverted-pendulum"]], "Pusher": [[105, "pusher"]], "Reacher": [[106, "reacher"]], "Swimmer": [[107, "swimmer"]], "Notes": [[107, "notes"]], "Walker2D": [[108, "walker2d"]], "Third-party Environments": [[109, "third-party-environments"]], "Video Game environments": [[109, "video-game-environments"]], "stable-retro: Classic retro games, a maintained version of OpenAI Retro": [[109, "stable-retro-classic-retro-games-a-maintained-version-of-openai-retro"]], "flappy-bird-gym: A Flappy Bird environment for Gym": [[109, "flappy-bird-gym-a-flappy-bird-environment-for-gym"]], "gym-derk: GPU accelerated MOBA environment": [[109, "gym-derk-gpu-accelerated-moba-environment"]], "SlimeVolleyGym: A simple environment for single and multi-agent reinforcement learning": [[109, "slimevolleygym-a-simple-environment-for-single-and-multi-agent-reinforcement-learning"]], "Unity ML Agents: Environments for Unity game engine": [[109, "unity-ml-agents-environments-for-unity-game-engine"]], "PGE: Parallel Game Engine": [[109, "pge-parallel-game-engine"]], "Robotics environments": [[109, "robotics-environments"]], "gym-jiminy: Training Robots in Jiminy": [[109, "gym-jiminy-training-robots-in-jiminy"]], "gym-pybullet-drones: Environments for quadcopter control": [[109, "gym-pybullet-drones-environments-for-quadcopter-control"]], "MarsExplorer: Environments for controlling robot on Mars": [[109, "marsexplorer-environments-for-controlling-robot-on-mars"]], "panda-gym: Robotics environments using the PyBullet physics engine": [[109, "panda-gym-robotics-environments-using-the-pybullet-physics-engine"]], "robo-gym: Real-world and simulation robotics": [[109, "robo-gym-real-world-and-simulation-robotics"]], "Offworld-gym": [[109, "offworld-gym"]], "safe-control-gym": [[109, "safe-control-gym"]], "gym-softrobot: Soft-robotics environments": [[109, "gym-softrobot-soft-robotics-environments"]], "iGibson": [[109, "igibson"]], "DexterousHands: dual dexterous hand manipulation tasks": [[109, "dexteroushands-dual-dexterous-hand-manipulation-tasks"]], "OmniIsaacGymEnvs": [[109, "omniisaacgymenvs"]], "Autonomous Driving environments": [[109, "autonomous-driving-environments"]], "sumo-rl": [[109, "sumo-rl"]], "gym-duckietown": [[109, "gym-duckietown"]], "gym-electric-motor": [[109, "gym-electric-motor"]], "highway-env": [[109, "highway-env"]], "CommonRoad-RL": [[109, "commonroad-rl"]], "tmrl: TrackMania 2020 through RL": [[109, "tmrl-trackmania-2020-through-rl"]], "racing_dreamer": [[109, "racing-dreamer"]], "l2r: Multimodal control environment where agents learn how to race": [[109, "l2r-multimodal-control-environment-where-agents-learn-how-to-race"]], "racecar_gym": [[109, "racecar-gym"]], "Other environments": [[109, "other-environments"]], "CompilerGym: Optimise compiler tasks": [[109, "compilergym-optimise-compiler-tasks"]], "CARL: context adaptive RL": [[109, "carl-context-adaptive-rl"]], "matrix-mdp: Easily create discrete MDPs": [[109, "matrix-mdp-easily-create-discrete-mdps"]], "mo-gym: Multi-objective Reinforcement Learning environments": [[109, "mo-gym-multi-objective-reinforcement-learning-environments"]], "gym-cellular-automata: Cellular Automata environments": [[109, "gym-cellular-automata-cellular-automata-environments"]], "gym-sokoban: 2D Transportation Puzzles": [[109, "gym-sokoban-2d-transportation-puzzles"]], "DACBench: Benchmark Library for Dynamic Algorithm configuration": [[109, "dacbench-benchmark-library-for-dynamic-algorithm-configuration"]], "NLPGym: A toolkit to develop RL agents to solve NLP tasks": [[109, "nlpgym-a-toolkit-to-develop-rl-agents-to-solve-nlp-tasks"]], "gym-saturation: Environments used to prove theorems": [[109, "gym-saturation-environments-used-to-prove-theorems"]], "ShinRL: Environments for evaluating RL algorithms": [[109, "shinrl-environments-for-evaluating-rl-algorithms"]], "gymnax: Hardware Accelerated RL Environments": [[109, "gymnax-hardware-accelerated-rl-environments"]], "gym-anytrading: Financial trading environments for FOREX and STOCKS": [[109, "gym-anytrading-financial-trading-environments-for-forex-and-stocks"]], "gym-mtsim: Financial trading for MetaTrader 5 platform": [[109, "gym-mtsim-financial-trading-for-metatrader-5-platform"]], "openmodelica-microgrid-gym: Environments for controlling power electronic converters in microgrids": [[109, "openmodelica-microgrid-gym-environments-for-controlling-power-electronic-converters-in-microgrids"]], "mobile-env: Environments for coordination of wireless mobile networks": [[109, "mobile-env-environments-for-coordination-of-wireless-mobile-networks"]], "GymFC: A flight control tuning and training framework": [[109, "gymfc-a-flight-control-tuning-and-training-framework"]], "Toy Text": [[110, "toy-text"]], "Blackjack": [[111, "blackjack"]], "Information": [[111, "information"], [112, "information"], [113, "information"], [114, "information"]], "Cliff Walking": [[112, "cliff-walking"]], "Frozen Lake": [[113, "frozen-lake"]], "Taxi": [[114, "taxi"]], "Gymnasium is a standard API for reinforcement learning, and a diverse collection of reference environments": [[115, "gymnasium-is-a-standard-api-for-reinforcement-learning-and-a-diverse-collection-of-reference-environments"]], "Solving Blackjack with Q-Learning": [[116, "solving-blackjack-with-q-learning"]], "Imports and Environment Setup": [[116, "imports-and-environment-setup"]], "Observing the environment": [[116, "observing-the-environment"]], "Executing an action": [[116, "executing-an-action"]], "Building an agent": [[116, "building-an-agent"], [119, "building-an-agent"]], "Visualizing the training": [[116, "visualizing-the-training"]], "Visualising the policy": [[116, "visualising-the-policy"]], "Think you can do better?": [[116, "think-you-can-do-better"]], "Make your own custom environment": [[117, "make-your-own-custom-environment"]], "Subclassing gymnasium.Env": [[117, "subclassing-gymnasium-env"]], "Declaration and Initialization": [[117, "declaration-and-initialization"]], "Constructing Observations From Environment States": [[117, "constructing-observations-from-environment-states"]], "Reset": [[117, "reset"]], "Step": [[117, "step"]], "Rendering": [[117, "rendering"]], "Close": [[117, "close"]], "Registering Envs": [[117, "registering-envs"]], "Creating a Package": [[117, "creating-a-package"]], "Creating Environment Instances": [[117, "creating-environment-instances"]], "Using Wrappers": [[117, "using-wrappers"]], "Handling Time Limits": [[118, "handling-time-limits"]], "Termination": [[118, "termination"]], "Truncation": [[118, "truncation"]], "Importance in learning code": [[118, "importance-in-learning-code"]], "Solution": [[118, "solution"]], "Training using REINFORCE for Mujoco": [[119, "training-using-reinforce-for-mujoco"]], "Policy Network": [[119, "policy-network"]], "Plot learning curve": [[119, "plot-learning-curve"]]}, "indexentries": {"env (class in gymnasium)": [[2, "gymnasium.Env"]], "action_space (gymnasium.env attribute)": [[2, "gymnasium.Env.action_space"]], "close() (in module gymnasium.env)": [[2, "gymnasium.Env.close"]], "metadata (gymnasium.env attribute)": [[2, "gymnasium.Env.metadata"]], "np_random (gymnasium.env property)": [[2, "gymnasium.Env.np_random"]], "observation_space (gymnasium.env attribute)": [[2, "gymnasium.Env.observation_space"]], "render() (in module gymnasium.env)": [[2, "gymnasium.Env.render"]], "render_mode (gymnasium.env attribute)": [[2, "gymnasium.Env.render_mode"]], "reset() (in module gymnasium.env)": [[2, "gymnasium.Env.reset"]], "reward_range (gymnasium.env attribute)": [[2, "gymnasium.Env.reward_range"]], "spec (gymnasium.env attribute)": [[2, "gymnasium.Env.spec"]], "step() (in module gymnasium.env)": [[2, "gymnasium.Env.step"]], "unwrapped (gymnasium.env property)": [[2, "gymnasium.Env.unwrapped"]], "funcenv (class in gymnasium.experimental)": [[4, "gymnasium.experimental.FuncEnv"]], "initial() (in module gymnasium.experimental.funcenv)": [[4, "gymnasium.experimental.FuncEnv.initial"], [4, "id0"]], "observation() (in module gymnasium.experimental.funcenv)": [[4, "gymnasium.experimental.FuncEnv.observation"], [4, "id1"]], "render_close() (in module gymnasium.experimental.funcenv)": [[4, "gymnasium.experimental.FuncEnv.render_close"]], "render_image() (in module gymnasium.experimental.funcenv)": [[4, "gymnasium.experimental.FuncEnv.render_image"]], "render_init() (in module gymnasium.experimental.funcenv)": [[4, "gymnasium.experimental.FuncEnv.render_init"]], "reward() (in module gymnasium.experimental.funcenv)": [[4, "gymnasium.experimental.FuncEnv.reward"]], "state_info() (in module gymnasium.experimental.funcenv)": [[4, "gymnasium.experimental.FuncEnv.state_info"]], "step_info() (in module gymnasium.experimental.funcenv)": [[4, "gymnasium.experimental.FuncEnv.step_info"]], "terminal() (in module gymnasium.experimental.funcenv)": [[4, "gymnasium.experimental.FuncEnv.terminal"]], "transform() (in module gymnasium.experimental.funcenv)": [[4, "gymnasium.experimental.FuncEnv.transform"]], "transition() (in module gymnasium.experimental.funcenv)": [[4, "gymnasium.experimental.FuncEnv.transition"]], "cliprewardv0 (class in gymnasium.experimental.wrappers)": [[7, "gymnasium.experimental.wrappers.ClipRewardV0"]], "lambdaactionv0 (class in gymnasium.experimental.wrappers)": [[7, "gymnasium.experimental.wrappers.LambdaActionV0"]], "lambdaobservationv0 (class in gymnasium.experimental.wrappers)": [[7, "gymnasium.experimental.wrappers.LambdaObservationV0"]], "lambdarewardv0 (class in gymnasium.experimental.wrappers)": [[7, "gymnasium.experimental.wrappers.LambdaRewardV0"]], "make() (in module gymnasium)": [[8, "gymnasium.make"]], "pprint_registry() (in module gymnasium)": [[8, "gymnasium.pprint_registry"]], "register() (in module gymnasium)": [[8, "gymnasium.register"]], "spec() (in module gymnasium)": [[8, "gymnasium.spec"]], "space (class in gymnasium.spaces)": [[9, "gymnasium.spaces.Space"]], "contains() (in module gymnasium.spaces.space.space)": [[9, "gymnasium.spaces.space.Space.contains"]], "dtype (space property)": [[9, "Space.dtype"]], "from_jsonable() (in module gymnasium.spaces.space.space)": [[9, "gymnasium.spaces.space.Space.from_jsonable"]], "sample() (in module gymnasium.spaces.space.space)": [[9, "gymnasium.spaces.space.Space.sample"]], "seed() (in module gymnasium.spaces.space.space)": [[9, "gymnasium.spaces.space.Space.seed"]], "shape (gymnasium.spaces.space.space property)": [[9, "gymnasium.spaces.space.Space.shape"]], "to_jsonable() (in module gymnasium.spaces.space.space)": [[9, "gymnasium.spaces.space.Space.to_jsonable"]], "dict (class in gymnasium.spaces)": [[10, "gymnasium.spaces.Dict"]], "graph (class in gymnasium.spaces)": [[10, "gymnasium.spaces.Graph"]], "sequence (class in gymnasium.spaces)": [[10, "gymnasium.spaces.Sequence"]], "tuple (class in gymnasium.spaces)": [[10, "gymnasium.spaces.Tuple"]], "sample() (gymnasium.spaces.dict method)": [[10, "gymnasium.spaces.Dict.sample"]], "sample() (gymnasium.spaces.graph method)": [[10, "gymnasium.spaces.Graph.sample"]], "sample() (gymnasium.spaces.sequence method)": [[10, "gymnasium.spaces.Sequence.sample"]], "sample() (gymnasium.spaces.tuple method)": [[10, "gymnasium.spaces.Tuple.sample"]], "seed() (gymnasium.spaces.dict method)": [[10, "gymnasium.spaces.Dict.seed"]], "seed() (gymnasium.spaces.graph method)": [[10, "gymnasium.spaces.Graph.seed"]], "seed() (gymnasium.spaces.sequence method)": [[10, "gymnasium.spaces.Sequence.seed"]], "seed() (gymnasium.spaces.tuple method)": [[10, "gymnasium.spaces.Tuple.seed"]], "box (class in gymnasium.spaces)": [[11, "gymnasium.spaces.Box"]], "discrete (class in gymnasium.spaces)": [[11, "gymnasium.spaces.Discrete"]], "multibinary (class in gymnasium.spaces)": [[11, "gymnasium.spaces.MultiBinary"]], "multidiscrete (class in gymnasium.spaces)": [[11, "gymnasium.spaces.MultiDiscrete"]], "text (class in gymnasium.spaces)": [[11, "gymnasium.spaces.Text"]], "is_bounded() (gymnasium.spaces.box method)": [[11, "gymnasium.spaces.Box.is_bounded"]], "sample() (gymnasium.spaces.box method)": [[11, "gymnasium.spaces.Box.sample"]], "sample() (gymnasium.spaces.discrete method)": [[11, "gymnasium.spaces.Discrete.sample"]], "sample() (gymnasium.spaces.multibinary method)": [[11, "gymnasium.spaces.MultiBinary.sample"]], "sample() (gymnasium.spaces.multidiscrete method)": [[11, "gymnasium.spaces.MultiDiscrete.sample"]], "sample() (gymnasium.spaces.text method)": [[11, "gymnasium.spaces.Text.sample"]], "seed() (gymnasium.spaces.box method)": [[11, "gymnasium.spaces.Box.seed"]], "seed() (gymnasium.spaces.discrete method)": [[11, "gymnasium.spaces.Discrete.seed"]], "seed() (gymnasium.spaces.multibinary method)": [[11, "gymnasium.spaces.MultiBinary.seed"]], "seed() (gymnasium.spaces.multidiscrete method)": [[11, "gymnasium.spaces.MultiDiscrete.seed"]], "seed() (gymnasium.spaces.text method)": [[11, "gymnasium.spaces.Text.seed"]], "flatdim() (in module gymnasium.spaces.utils)": [[12, "gymnasium.spaces.utils.flatdim"]], "flatten() (in module gymnasium.spaces.utils)": [[12, "gymnasium.spaces.utils.flatten"]], "flatten_space() (in module gymnasium.spaces.utils)": [[12, "gymnasium.spaces.utils.flatten_space"]], "unflatten() (in module gymnasium.spaces.utils)": [[12, "gymnasium.spaces.utils.unflatten"]], "batch_space() (in module gymnasium.vector.utils)": [[13, "gymnasium.vector.utils.batch_space"]], "concatenate() (in module gymnasium.vector.utils)": [[13, "gymnasium.vector.utils.concatenate"]], "create_empty_array() (in module gymnasium.vector.utils)": [[13, "gymnasium.vector.utils.create_empty_array"]], "create_shared_memory() (in module gymnasium.vector.utils)": [[13, "gymnasium.vector.utils.create_shared_memory"]], "iterate() (in module gymnasium.vector.utils)": [[13, "gymnasium.vector.utils.iterate"]], "read_from_shared_memory() (in module gymnasium.vector.utils)": [[13, "gymnasium.vector.utils.read_from_shared_memory"]], "write_to_shared_memory() (in module gymnasium.vector.utils)": [[13, "gymnasium.vector.utils.write_to_shared_memory"]], "playplot (class in gymnasium.utils.play)": [[14, "gymnasium.utils.play.PlayPlot"]], "playablegame (class in gymnasium.utils.play)": [[14, "gymnasium.utils.play.PlayableGame"]], "callback() (gymnasium.utils.play.playplot method)": [[14, "gymnasium.utils.play.PlayPlot.callback"]], "capped_cubic_video_schedule() (in module gymnasium.utils.save_video)": [[14, "gymnasium.utils.save_video.capped_cubic_video_schedule"]], "check_env() (in module gymnasium.utils.env_checker)": [[14, "gymnasium.utils.env_checker.check_env"]], "convert_to_done_step_api() (in module gymnasium.utils.step_api_compatibility)": [[14, "gymnasium.utils.step_api_compatibility.convert_to_done_step_api"]], "convert_to_terminated_truncated_step_api() (in module gymnasium.utils.step_api_compatibility)": [[14, "gymnasium.utils.step_api_compatibility.convert_to_terminated_truncated_step_api"]], "np_random() (in module gymnasium.utils.seeding)": [[14, "gymnasium.utils.seeding.np_random"]], "play() (in module gymnasium.utils.play)": [[14, "gymnasium.utils.play.play"]], "process_event() (gymnasium.utils.play.playablegame method)": [[14, "gymnasium.utils.play.PlayableGame.process_event"]], "save_video() (in module gymnasium.utils.save_video)": [[14, "gymnasium.utils.save_video.save_video"]], "step_api_compatibility() (in module gymnasium.utils.step_api_compatibility)": [[14, "gymnasium.utils.step_api_compatibility.step_api_compatibility"]], "asyncvectorenv (class in gymnasium.vector)": [[15, "gymnasium.vector.AsyncVectorEnv"]], "syncvectorenv (class in gymnasium.vector)": [[15, "gymnasium.vector.SyncVectorEnv"]], "vectorenv (class in gymnasium.vector)": [[15, "gymnasium.vector.VectorEnv"]], "action_space": [[15, "action_space"]], "close() (gymnasium.vector.vectorenv method)": [[15, "gymnasium.vector.VectorEnv.close"]], "make() (in module gymnasium.vector)": [[15, "gymnasium.vector.make"]], "observation_space": [[15, "observation_space"]], "reset() (gymnasium.vector.vectorenv method)": [[15, "gymnasium.vector.VectorEnv.reset"]], "single_action_space": [[15, "single_action_space"]], "single_observation_space": [[15, "single_observation_space"]], "step() (gymnasium.vector.vectorenv method)": [[15, "gymnasium.vector.VectorEnv.step"]], "wrapper (class in gymnasium)": [[16, "gymnasium.Wrapper"]], "action_space (gymnasium.wrapper property)": [[16, "gymnasium.Wrapper.action_space"]], "close() (in module gymnasium.wrapper)": [[16, "gymnasium.Wrapper.close"]], "metadata (gymnasium.wrapper property)": [[16, "gymnasium.Wrapper.metadata"]], "np_random (gymnasium.wrapper property)": [[16, "gymnasium.Wrapper.np_random"]], "observation_space (gymnasium.wrapper property)": [[16, "gymnasium.Wrapper.observation_space"]], "reset() (in module gymnasium.wrapper)": [[16, "gymnasium.Wrapper.reset"]], "reward_range (gymnasium.wrapper property)": [[16, "gymnasium.Wrapper.reward_range"]], "spec (gymnasium.wrapper property)": [[16, "gymnasium.Wrapper.spec"]], "step() (in module gymnasium.wrapper)": [[16, "gymnasium.Wrapper.step"]], "unwrapped (gymnasium.wrapper property)": [[16, "gymnasium.Wrapper.unwrapped"]], "actionwrapper (class in gymnasium)": [[17, "gymnasium.ActionWrapper"]], "actionwrapper.action() (in module gymnasium.actionwrapper)": [[17, "gymnasium.ActionWrapper.ActionWrapper.action"]], "clipaction (class in gymnasium.wrappers)": [[17, "gymnasium.wrappers.ClipAction"]], "rescaleaction (class in gymnasium.wrappers)": [[17, "gymnasium.wrappers.RescaleAction"]], "ataripreprocessing (class in gymnasium.wrappers)": [[18, "gymnasium.wrappers.AtariPreprocessing"]], "autoresetwrapper (class in gymnasium.wrappers)": [[18, "gymnasium.wrappers.AutoResetWrapper"]], "envcompatibility (class in gymnasium.wrappers)": [[18, "gymnasium.wrappers.EnvCompatibility"]], "humanrendering (class in gymnasium.wrappers)": [[18, "gymnasium.wrappers.HumanRendering"]], "orderenforcing (class in gymnasium.wrappers)": [[18, "gymnasium.wrappers.OrderEnforcing"]], "passiveenvchecker (class in gymnasium.wrappers)": [[18, "gymnasium.wrappers.PassiveEnvChecker"]], "recordepisodestatistics (class in gymnasium.wrappers)": [[18, "gymnasium.wrappers.RecordEpisodeStatistics"]], "recordvideo (class in gymnasium.wrappers)": [[18, "gymnasium.wrappers.RecordVideo"]], "rendercollection (class in gymnasium.wrappers)": [[18, "gymnasium.wrappers.RenderCollection"]], "stepapicompatibility (class in gymnasium.wrappers)": [[18, "gymnasium.wrappers.StepAPICompatibility"]], "timelimit (class in gymnasium.wrappers)": [[18, "gymnasium.wrappers.TimeLimit"]], "vectorlistinfo (class in gymnasium.wrappers)": [[18, "gymnasium.wrappers.VectorListInfo"]], "filterobservation (class in gymnasium.wrappers)": [[19, "gymnasium.wrappers.FilterObservation"]], "flattenobservation (class in gymnasium.wrappers)": [[19, "gymnasium.wrappers.FlattenObservation"]], "framestack (class in gymnasium.wrappers)": [[19, "gymnasium.wrappers.FrameStack"]], "grayscaleobservation (class in gymnasium.wrappers)": [[19, "gymnasium.wrappers.GrayScaleObservation"]], "normalizeobservation (class in gymnasium.wrappers)": [[19, "gymnasium.wrappers.NormalizeObservation"]], "observationwrapper (class in gymnasium)": [[19, "gymnasium.ObservationWrapper"]], "pixelobservationwrapper (class in gymnasium.wrappers)": [[19, "gymnasium.wrappers.PixelObservationWrapper"]], "resizeobservation (class in gymnasium.wrappers)": [[19, "gymnasium.wrappers.ResizeObservation"]], "timeawareobservation (class in gymnasium.wrappers)": [[19, "gymnasium.wrappers.TimeAwareObservation"]], "transformobservation (class in gymnasium.wrappers)": [[19, "gymnasium.wrappers.TransformObservation"]], "observation() (in module gymnasium.observationwrapper)": [[19, "gymnasium.ObservationWrapper.observation"]], "normalizereward (class in gymnasium.wrappers)": [[20, "gymnasium.wrappers.NormalizeReward"]], "rewardwrapper (class in gymnasium)": [[20, "gymnasium.RewardWrapper"]], "rewardwrapper.reward() (in module gymnasium.rewardwrapper)": [[20, "gymnasium.RewardWrapper.RewardWrapper.reward"]], "transformreward (class in gymnasium.wrappers)": [[20, "gymnasium.wrappers.TransformReward"]]}}) \ No newline at end of file +Search.setIndex({"docnames": ["404", "README", "api/env", "api/experimental", "api/experimental/functional", "api/experimental/vector", "api/experimental/vector_wrappers", "api/experimental/wrappers", "api/registry", "api/spaces", "api/spaces/composite", "api/spaces/fundamental", "api/spaces/utils", "api/spaces/vector_utils", "api/utils", "api/vector", "api/wrappers", "api/wrappers/action_wrappers", "api/wrappers/misc_wrappers", "api/wrappers/observation_wrappers", "api/wrappers/reward_wrappers", "content/basic_usage", "content/gym_compatibility", "content/migration-guide", "environments/atari", "environments/atari/adventure", "environments/atari/air_raid", "environments/atari/alien", "environments/atari/amidar", "environments/atari/assault", "environments/atari/asterix", "environments/atari/asteroids", "environments/atari/atlantis", "environments/atari/bank_heist", "environments/atari/battle_zone", "environments/atari/beam_rider", "environments/atari/berzerk", "environments/atari/bowling", "environments/atari/boxing", "environments/atari/breakout", "environments/atari/carnival", "environments/atari/centipede", "environments/atari/chopper_command", "environments/atari/complete_list", "environments/atari/crazy_climber", "environments/atari/defender", "environments/atari/demon_attack", "environments/atari/double_dunk", "environments/atari/elevator_action", "environments/atari/enduro", "environments/atari/fishing_derby", "environments/atari/freeway", "environments/atari/frostbite", "environments/atari/gopher", "environments/atari/gravitar", "environments/atari/hero", "environments/atari/ice_hockey", "environments/atari/jamesbond", "environments/atari/journey_escape", "environments/atari/kangaroo", "environments/atari/krull", "environments/atari/kung_fu_master", "environments/atari/montezuma_revenge", "environments/atari/ms_pacman", "environments/atari/name_this_game", "environments/atari/phoenix", "environments/atari/pitfall", "environments/atari/pong", "environments/atari/pooyan", "environments/atari/private_eye", "environments/atari/qbert", "environments/atari/riverraid", "environments/atari/road_runner", "environments/atari/robotank", "environments/atari/seaquest", "environments/atari/skiing", "environments/atari/solaris", "environments/atari/space_invaders", "environments/atari/star_gunner", "environments/atari/tennis", "environments/atari/time_pilot", "environments/atari/tutankham", "environments/atari/up_n_down", "environments/atari/venture", "environments/atari/video_pinball", "environments/atari/wizard_of_wor", "environments/atari/zaxxon", "environments/box2d", "environments/box2d/bipedal_walker", "environments/box2d/car_racing", "environments/box2d/lunar_lander", "environments/classic_control", "environments/classic_control/acrobot", "environments/classic_control/cart_pole", "environments/classic_control/mountain_car", "environments/classic_control/mountain_car_continuous", "environments/classic_control/pendulum", "environments/mujoco", "environments/mujoco/ant", "environments/mujoco/half_cheetah", "environments/mujoco/hopper", "environments/mujoco/humanoid", "environments/mujoco/humanoid_standup", "environments/mujoco/inverted_double_pendulum", "environments/mujoco/inverted_pendulum", "environments/mujoco/pusher", "environments/mujoco/reacher", "environments/mujoco/swimmer", "environments/mujoco/walker2d", "environments/third_party_environments", "environments/toy_text", "environments/toy_text/blackjack", "environments/toy_text/cliff_walking", "environments/toy_text/frozen_lake", "environments/toy_text/taxi", "index", "tutorials/blackjack_tutorial", "tutorials/environment_creation", "tutorials/handling_time_limits", "tutorials/reinforce_invpend_gym_v26"], "filenames": ["404.md", "README.md", "api/env.md", "api/experimental.md", "api/experimental/functional.md", "api/experimental/vector.md", "api/experimental/vector_wrappers.md", "api/experimental/wrappers.md", "api/registry.md", "api/spaces.md", "api/spaces/composite.md", "api/spaces/fundamental.md", "api/spaces/utils.md", "api/spaces/vector_utils.md", "api/utils.md", "api/vector.md", "api/wrappers.md", "api/wrappers/action_wrappers.md", "api/wrappers/misc_wrappers.md", "api/wrappers/observation_wrappers.md", "api/wrappers/reward_wrappers.md", "content/basic_usage.md", "content/gym_compatibility.md", "content/migration-guide.md", "environments/atari.md", "environments/atari/adventure.md", "environments/atari/air_raid.md", "environments/atari/alien.md", "environments/atari/amidar.md", "environments/atari/assault.md", "environments/atari/asterix.md", "environments/atari/asteroids.md", "environments/atari/atlantis.md", "environments/atari/bank_heist.md", "environments/atari/battle_zone.md", "environments/atari/beam_rider.md", "environments/atari/berzerk.md", "environments/atari/bowling.md", "environments/atari/boxing.md", "environments/atari/breakout.md", "environments/atari/carnival.md", "environments/atari/centipede.md", "environments/atari/chopper_command.md", "environments/atari/complete_list.md", "environments/atari/crazy_climber.md", "environments/atari/defender.md", "environments/atari/demon_attack.md", "environments/atari/double_dunk.md", "environments/atari/elevator_action.md", "environments/atari/enduro.md", "environments/atari/fishing_derby.md", "environments/atari/freeway.md", "environments/atari/frostbite.md", "environments/atari/gopher.md", "environments/atari/gravitar.md", "environments/atari/hero.md", "environments/atari/ice_hockey.md", "environments/atari/jamesbond.md", "environments/atari/journey_escape.md", "environments/atari/kangaroo.md", "environments/atari/krull.md", "environments/atari/kung_fu_master.md", "environments/atari/montezuma_revenge.md", "environments/atari/ms_pacman.md", "environments/atari/name_this_game.md", "environments/atari/phoenix.md", "environments/atari/pitfall.md", "environments/atari/pong.md", "environments/atari/pooyan.md", "environments/atari/private_eye.md", "environments/atari/qbert.md", "environments/atari/riverraid.md", "environments/atari/road_runner.md", "environments/atari/robotank.md", "environments/atari/seaquest.md", "environments/atari/skiing.md", "environments/atari/solaris.md", "environments/atari/space_invaders.md", "environments/atari/star_gunner.md", "environments/atari/tennis.md", "environments/atari/time_pilot.md", "environments/atari/tutankham.md", "environments/atari/up_n_down.md", "environments/atari/venture.md", "environments/atari/video_pinball.md", "environments/atari/wizard_of_wor.md", "environments/atari/zaxxon.md", "environments/box2d.md", "environments/box2d/bipedal_walker.md", "environments/box2d/car_racing.md", "environments/box2d/lunar_lander.md", "environments/classic_control.md", "environments/classic_control/acrobot.md", "environments/classic_control/cart_pole.md", "environments/classic_control/mountain_car.md", "environments/classic_control/mountain_car_continuous.md", "environments/classic_control/pendulum.md", "environments/mujoco.md", "environments/mujoco/ant.md", "environments/mujoco/half_cheetah.md", "environments/mujoco/hopper.md", "environments/mujoco/humanoid.md", "environments/mujoco/humanoid_standup.md", "environments/mujoco/inverted_double_pendulum.md", "environments/mujoco/inverted_pendulum.md", "environments/mujoco/pusher.md", "environments/mujoco/reacher.md", "environments/mujoco/swimmer.md", "environments/mujoco/walker2d.md", "environments/third_party_environments.md", "environments/toy_text.md", "environments/toy_text/blackjack.md", "environments/toy_text/cliff_walking.md", "environments/toy_text/frozen_lake.md", "environments/toy_text/taxi.md", "index.md", "tutorials/blackjack_tutorial.rst", "tutorials/environment_creation.rst", "tutorials/handling_time_limits.rst", "tutorials/reinforce_invpend_gym_v26.rst"], "titles": ["404 - Page Not Found", "Gymnasium-docs", "Env", "Experimental", "Functional Environment", "Vectorizing Environment", "Vector Environment Wrappers", "Wrappers", "Registry", "Spaces", "Composite Spaces", "Fundamental Spaces", "Spaces Utils", "Spaces Vector Utils", "Utils", "Vector", "Wrappers", "Action Wrappers", "Misc Wrappers", "Observation Wrappers", "Reward Wrappers", "Basic Usage", "Compatibility with Gym", "v21 to v26 Migration Guide", "Atari", "Adventure", "Air Raid", "Alien", "Amidar", "Assault", "Asterix", "Asteroids", "Atlantis", "Bank Heist", "Battle Zone", "Beam Rider", "Berzerk", "Bowling", "Boxing", "Breakout", "Carnival", "Centipede", "Chopper Command", "Complete List - Atari", "Crazy Climber", "Defender", "Demon Attack", "Double Dunk", "Elevator Action", "Enduro", "FishingDerby", "Freeway", "Frostbite", "Gopher", "Gravitar", "Hero", "IceHockey", "Jamesbond", "JourneyEscape", "Kangaroo", "Krull", "Kung Fu Master", "Montezuma Revenge", "Ms Pacman", "Name This Game", "Phoenix", "Pitfall", "Pong", "Pooyan", "PrivateEye", "Qbert", "Riverraid", "Road Runner", "Robot Tank", "Seaquest", "Skiings", "Solaris", "SpaceInvaders", "StarGunner", "Tennis", "TimePilot", "Tutankham", "Up n\u2019 Down", "Venture", "Video Pinball", "Wizard of Wor", "Zaxxon", "Box2D", "Bipedal Walker", "Car Racing", "Lunar Lander", "Classic Control", "Acrobot", "Cart Pole", "Mountain Car", "Mountain Car Continuous", "Pendulum", "MuJoCo", "Ant", "Half Cheetah", "Hopper", "Humanoid", "Humanoid Standup", "Inverted Double Pendulum", "Inverted Pendulum", "Pusher", "Reacher", "Swimmer", "Walker2D", "Third-party Environments", "Toy Text", "Blackjack", "Cliff Walking", "Frozen Lake", "Taxi", "Gymnasium is a standard API for reinforcement learning, and a diverse collection of reference environments", "Solving Blackjack with Q-Learning", "Make your own custom environment", "Handling Time Limits", "Training using REINFORCE for Mujoco"], "terms": {"thi": [1, 2, 3, 4, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 111, 112, 113, 114, 115, 116, 117, 118, 119], "folder": [1, 14, 18, 105, 106], "contain": [1, 2, 3, 9, 12, 13, 15, 16, 18, 19, 21, 23, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 98, 99, 100, 101, 105, 106, 107, 108, 109, 111, 114, 116, 117, 119], "If": [1, 2, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 24, 30, 33, 38, 41, 50, 51, 52, 53, 54, 68, 75, 79, 88, 89, 90, 95, 98, 100, 101, 102, 106, 108, 111, 112, 113, 116, 117], "you": [1, 2, 9, 10, 11, 12, 14, 15, 16, 17, 18, 19, 20, 21, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 89, 90, 98, 101, 102, 105, 106, 109, 115, 117, 118], "ar": [1, 2, 3, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 116, 117, 118, 119], "pleas": [1, 2, 14, 23, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 89, 90, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 112, 113, 114], "pr": [1, 23, 109], "repo": [1, 24], "otherwis": [1, 2, 8, 10, 11, 14, 15, 18, 19, 24, 37, 109, 116], "follow": [1, 4, 8, 9, 14, 16, 17, 18, 20, 21, 24, 37, 47, 49, 50, 51, 52, 53, 54, 79, 92, 93, 94, 95, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 111, 112, 113, 114, 116, 117, 118, 119], "below": [1, 11, 16, 21, 50, 88, 90, 96, 105, 108, 116, 118], "directli": [1, 10, 16, 18, 21, 92, 109, 116, 117, 119], "markdown": 1, "file": [1, 92, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 117], "repositori": [1, 16, 97], "fork": [1, 23, 109, 115], "docstr": 1, "": [1, 2, 4, 10, 11, 14, 15, 16, 17, 18, 19, 20, 21, 24, 44, 50, 51, 52, 53, 54, 56, 57, 60, 61, 62, 67, 68, 70, 87, 88, 89, 90, 91, 92, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119], "python": [1, 8, 13, 18, 21, 88, 89, 90, 115, 116, 117, 118, 119], "Then": [1, 16, 17, 21, 74, 107], "pip": [1, 24, 87, 91, 97, 117], "instal": [1, 14, 18, 32, 87, 91, 97, 117], "your": [1, 2, 15, 16, 17, 18, 19, 20, 21, 27, 28, 30, 32, 33, 35, 37, 38, 39, 41, 47, 49, 50, 51, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 67, 69, 70, 71, 72, 73, 74, 75, 76, 77, 80, 81, 82, 83, 84, 85, 86, 89, 98, 101, 102, 115, 116], "run": [1, 2, 8, 15, 18, 33, 55, 58, 66, 71, 72, 75, 76, 88, 90, 92, 98, 99, 100, 101, 102, 103, 104, 107, 108, 109, 112, 117], "script": [1, 116], "gen_md": 1, "py": [1, 13, 24, 88, 89, 90, 97, 98, 101, 102, 112, 116, 117, 118, 119], "automat": [1, 2, 8, 15, 16, 18, 22, 23, 117], "gener": [1, 2, 9, 10, 11, 14, 15, 16, 18, 19, 21, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 89, 90, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 111, 112, 113, 114, 115, 117], "For": [1, 2, 4, 11, 12, 14, 16, 18, 19, 21, 22, 23, 24, 25, 27, 28, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 45, 55, 56, 57, 58, 59, 60, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 89, 90, 97, 112, 113, 114, 116, 117], "add": [1, 8, 14, 15, 19, 21, 89, 97, 101, 102, 114, 116, 117], "complet": [1, 16, 18, 21, 23, 24, 44, 57, 69, 70, 89, 90, 116, 118], "ensur": [1, 2, 8, 10, 12, 14, 21, 116, 117], "i": [1, 2, 3, 4, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 89, 90, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 111, 112, 113, 114, 116, 117, 118, 119], "ha": [1, 2, 3, 9, 11, 12, 14, 16, 18, 19, 20, 21, 23, 24, 54, 74, 88, 89, 90, 91, 97, 98, 99, 100, 101, 102, 105, 106, 107, 108, 109, 111, 115, 116, 117, 118, 119], "properli": [1, 9], "format": [1, 9, 14, 16, 18, 19, 21], "md": [1, 117], "correspond": [1, 2, 8, 23, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 90, 92, 93, 94, 95, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 114, 117, 119], "gif": [1, 92], "_static": 1, "video": [1, 16, 43, 73, 88], "env_typ": 1, "where": [1, 3, 7, 8, 10, 11, 12, 14, 16, 18, 19, 21, 23, 24, 47, 89, 92, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 112, 113, 114, 115, 116, 117, 118, 119], "categori": 1, "e": [1, 2, 3, 9, 11, 12, 13, 15, 16, 18, 19, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 105, 106, 109, 111, 113, 116, 117, 119], "g": [1, 2, 9, 11, 12, 13, 15, 16, 75, 92, 96, 109, 113, 114, 116, 117, 119], "mujoco": [1, 16, 21, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108], "snake_cas": 1, "name": [1, 3, 4, 8, 16, 43, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 117], "convent": [1, 2, 24], "altern": [1, 24], "gen_gif": 1, "index": [1, 13, 14, 18, 19, 21, 24, 93, 102], "toctre": 1, "requir": [1, 2, 9, 19, 97, 116, 119], "packag": [1, 18, 109], "cd": [1, 117], "r": [1, 7, 11, 18, 20, 73, 92, 96, 109, 111, 112, 114, 119], "txt": 1, "To": [1, 8, 13, 15, 18, 19, 20, 21, 22, 23, 24, 32, 42, 70, 88, 89, 90, 92, 114, 116, 117, 119], "builder": 1, "onc": [1, 18, 31, 41, 48, 55, 103, 106, 114, 116, 117], "make": [1, 2, 7, 10, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 89, 90, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 112, 113, 114, 115, 116, 119], "dirhtml": 1, "_build": 1, "rebuild": [1, 32], "everi": [1, 14, 18, 21, 41, 42, 46, 51, 73, 74, 83, 89, 90, 93, 98, 100, 101, 108, 109, 117, 119], "time": [1, 2, 8, 10, 14, 15, 16, 24, 40, 43, 46, 47, 48, 52, 56, 58, 59, 66, 70, 71, 72, 73, 74, 75, 88, 89, 96, 98, 99, 100, 101, 102, 107, 108, 109, 112, 114, 116, 117, 119], "chang": [1, 2, 3, 4, 13, 14, 15, 16, 18, 19, 20, 21, 22, 23, 24, 52, 60, 70, 89, 92, 93, 94, 95, 96, 97, 105, 106, 109, 114, 116, 117, 119], "made": [1, 3, 105, 106], "sphinx": 1, "autobuild": 1, "b": [1, 11, 105, 106, 114], "we": [1, 2, 3, 4, 11, 18, 19, 20, 21, 23, 24, 98, 101, 102, 116, 117, 118, 119], "us": [1, 2, 3, 4, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 113, 114, 116, 118], "galleri": 1, "insid": [1, 10, 11, 18, 117], "directori": 1, "check": [1, 2, 11, 18, 114, 116, 117], "demo": 1, "see": [1, 2, 9, 14, 15, 21, 23, 24, 25, 28, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 45, 55, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 90, 92, 98, 99, 100, 101, 107, 108, 109, 113, 117], "exampl": [1, 2, 7, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 89, 92, 111, 112, 113, 116, 117, 118], "more": [1, 2, 3, 9, 10, 11, 14, 15, 16, 19, 23, 24, 25, 28, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 45, 50, 55, 56, 57, 58, 59, 60, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 88, 90, 97, 98, 101, 102, 103, 104, 105, 106, 107, 109, 116, 117, 118, 119], "inform": [1, 2, 9, 10, 11, 14, 15, 16, 18, 19, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 89, 90, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 116, 117, 118, 119], "convert": [1, 8, 9, 10, 16, 18, 19, 22, 23, 89, 116], "jupyt": [1, 116, 117, 118, 119], "notebook": [1, 116, 117, 118, 119], "can": [1, 2, 3, 8, 9, 10, 11, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 111, 112, 113, 114, 117, 119], "want": [1, 2, 10, 15, 16, 17, 18, 20, 21, 33, 55, 116, 117], "execut": [1, 14, 17, 24, 47, 114, 117, 119], "which": [1, 2, 8, 9, 10, 12, 13, 14, 15, 16, 18, 19, 20, 21, 22, 23, 24, 44, 46, 48, 62, 89, 90, 92, 93, 97, 98, 99, 100, 101, 102, 103, 105, 106, 107, 108, 109, 112, 113, 114, 117, 118, 119], "output": [1, 13, 14, 18, 21, 116, 119], "plot": [1, 14, 116], "should": [1, 2, 9, 11, 14, 15, 18, 19, 21, 23, 105, 106, 116, 117], "start": [1, 2, 9, 11, 14, 15, 18, 34, 47, 48, 54, 58, 59, 74, 116, 119], "run_": 1, "note": [1, 9, 13, 18, 92, 93, 98, 101, 102, 114, 116, 118, 119], "so": [1, 14, 15, 16, 18, 19, 21, 24, 52, 75, 90, 91, 98, 99, 100, 101, 102, 103, 104, 107, 108, 109, 113, 116, 117, 118], "sure": [1, 2, 18, 117], "doesn": [1, 2, 8, 16, 18, 24, 90, 118], "t": [1, 2, 8, 10, 12, 14, 16, 18, 19, 20, 23, 24, 40, 50, 51, 52, 53, 54, 73, 74, 89, 90, 94, 95, 114, 116, 117, 118], "take": [1, 2, 4, 7, 8, 11, 12, 14, 15, 16, 17, 18, 21, 23, 24, 77, 91, 93, 95, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 114, 116, 119], "than": [1, 23, 50, 56, 74, 90, 92, 93, 94, 95, 99, 103, 104, 105, 107, 109, 111, 116], "few": [1, 92, 116], "second": [1, 10, 14, 15, 37, 68, 75, 90, 99, 103, 106, 107], "class": [2, 3, 4, 7, 9, 10, 11, 14, 15, 16, 17, 18, 19, 20, 21, 97, 116, 117, 119], "The": [2, 3, 4, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 111, 112, 113, 114, 115, 116, 117, 118, 119], "main": [2, 90, 100, 108], "reinforc": [2, 9, 21, 92, 107, 110, 111, 112, 114, 116, 118], "learn": [2, 9, 10, 18, 19, 20, 21, 24, 50, 51, 52, 53, 54, 88, 89, 90, 92, 93, 94, 95, 99, 102, 103, 104, 107, 110, 111, 112, 114, 117], "agent": [2, 3, 9, 16, 18, 19, 21, 23, 24, 48, 57, 88, 89, 90, 94, 98, 99, 100, 101, 102, 103, 104, 107, 108, 117, 118], "encapsul": 2, "an": [2, 4, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 90, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 105, 106, 107, 108, 109, 111, 112, 113, 114, 117, 118], "arbitrari": [2, 8, 11, 14, 19, 20, 109], "behind": [2, 68], "scene": [2, 68, 109], "dynam": [2, 24, 39, 50, 51, 52, 53, 54, 92, 96, 97, 103], "through": [2, 8, 9, 15, 22, 23, 24, 39, 55, 58, 61, 62, 66, 75, 76, 101, 102, 118], "step": [2, 7, 8, 15, 16, 17, 18, 19, 20, 21, 24, 88, 90, 92, 93, 96, 112, 113, 114, 115, 116, 118, 119], "reset": [2, 7, 8, 14, 15, 16, 18, 19, 20, 21, 92, 93, 94, 95, 96, 109, 112, 113, 114, 115, 116, 119], "function": [2, 7, 8, 9, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 90, 96, 106, 109, 113, 114, 116, 118, 119], "partial": 2, "fulli": 2, "observ": [2, 4, 9, 10, 13, 14, 15, 16, 17, 18, 20, 23, 109, 115, 118, 119], "singl": [2, 4, 9, 10, 11, 12, 13, 14, 15, 19, 21, 100, 101, 102, 108, 117, 119], "multi": [2, 11, 97, 101, 102, 105], "pettingzoo": 2, "api": [2, 4, 16, 18, 21, 23, 117, 118], "user": [2, 4, 8, 15, 21, 23, 24, 92, 93, 94, 95, 96, 109, 117, 119], "need": [2, 8, 9, 10, 14, 16, 17, 18, 19, 21, 23, 42, 44, 49, 55, 59, 69, 74, 88, 90, 93, 97, 116, 117, 118], "know": [2, 18, 21, 117], "updat": [2, 14, 18, 19, 21, 22, 23, 114, 116, 117, 118, 119], "action": [2, 4, 8, 9, 10, 11, 14, 15, 16, 18, 23, 43, 91, 109, 110, 115, 117, 119], "return": [2, 4, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 98, 99, 100, 101, 102, 103, 105, 106, 107, 108, 111, 112, 113, 114, 116, 117, 118, 119], "next": [2, 4, 13, 21, 23, 44, 46, 48, 119], "reward": [2, 4, 8, 14, 15, 16, 18, 21, 23, 97, 109, 115, 116, 117, 118, 119], "termin": [2, 4, 8, 14, 15, 16, 18, 20, 21, 22, 23, 92, 93, 94, 95, 98, 100, 101, 102, 103, 104, 105, 106, 108, 111, 112, 113, 114, 115, 116, 117, 119], "truncat": [2, 8, 14, 15, 16, 18, 20, 21, 22, 23, 92, 93, 94, 95, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 113, 114, 115, 116, 117, 119], "due": [2, 23, 113, 118], "latest": [2, 119], "from": [2, 3, 4, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 23, 24, 26, 40, 47, 52, 53, 56, 58, 67, 68, 80, 86, 88, 89, 90, 92, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 111, 112, 113, 114, 116, 118, 119], "about": [2, 4, 14, 19, 21, 69, 92, 98, 101, 102, 116, 117, 118, 119], "metric": [2, 14, 23], "debug": [2, 9, 14, 110], "info": [2, 4, 14, 15, 16, 19, 20, 21, 23, 98, 99, 100, 101, 105, 106, 107, 108, 114, 115, 116, 117, 118, 119], "initi": [2, 4, 7, 8, 10, 11, 15, 16, 17, 18, 19, 20, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 90, 91, 92, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 111, 112, 113, 114, 116, 119], "state": [2, 4, 16, 18, 19, 21, 23, 24, 91, 97, 109, 110, 116, 118, 119], "befor": [2, 8, 14, 15, 16, 17, 18, 19, 20, 32, 44, 58, 69, 76, 77, 89, 98, 99, 100, 101, 102, 103, 104, 106, 107, 108, 117, 119], "call": [2, 3, 8, 12, 14, 15, 16, 17, 18, 19, 21, 22, 23, 24, 37, 56, 105, 106, 111, 113, 116, 117], "first": [2, 14, 15, 16, 18, 19, 21, 23, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 89, 90, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 111, 112, 113, 114, 116, 117, 119], "episod": [2, 8, 14, 16, 19, 23, 116, 117, 118, 119], "render": [2, 4, 15, 16, 19, 21, 24, 87, 88, 98, 99, 100, 101, 102, 103, 104, 107, 108, 109, 116], "help": [2, 9, 21, 27, 59, 62, 105, 116], "visualis": [2, 21], "what": [2, 9, 18, 24, 112], "mode": [2, 15, 16, 18, 21, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 116, 117], "human": [2, 10, 16, 21, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 89, 101, 102, 105, 115, 117], "rgb_arrai": [2, 14, 16, 18, 19, 24, 117], "ansi": [2, 117], "text": [2, 9, 10, 12, 21, 111, 112, 113, 114], "close": [2, 4, 11, 14, 15, 16, 21, 23, 44, 69, 98, 100, 101, 106, 108, 115, 116], "import": [2, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 89, 90, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 112, 113, 114, 115, 117, 119], "when": [2, 9, 10, 12, 13, 14, 15, 16, 18, 19, 20, 22, 24, 27, 40, 44, 45, 46, 48, 50, 51, 52, 53, 54, 56, 57, 71, 72, 73, 74, 77, 89, 90, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 112, 113, 114, 117, 118, 119], "extern": [2, 23, 98, 101, 102, 118], "softwar": [2, 109], "pygam": [2, 14, 23, 87, 117], "databas": 2, "have": [2, 8, 11, 12, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 27, 30, 32, 33, 37, 39, 41, 42, 44, 45, 50, 51, 52, 53, 54, 55, 58, 59, 60, 64, 66, 68, 74, 76, 87, 88, 89, 92, 98, 99, 100, 101, 102, 104, 105, 107, 108, 109, 111, 113, 114, 116, 117, 118, 119], "understand": [2, 12, 15, 105, 109, 119], "action_spac": [2, 14, 15, 16, 17, 19, 20, 21, 23, 114, 115, 116, 117, 119], "space": [2, 3, 14, 15, 16, 17, 18, 19, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 97, 109, 110, 117, 119], "object": [2, 9, 13, 16, 21, 25, 30, 44, 50, 51, 59, 71, 77, 105, 116, 119], "valid": [2, 8, 9, 11, 13, 15, 16, 17, 18, 21, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 116], "all": [2, 3, 10, 11, 15, 16, 18, 21, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 51, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 89, 90, 91, 92, 93, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 111, 112, 113, 116, 119], "within": [2, 9, 17, 19, 21, 23, 62, 66, 90, 91, 103, 104], "observation_spac": [2, 10, 11, 15, 16, 19, 21, 117, 119], "reward_rang": [2, 16, 20], "A": [2, 4, 7, 9, 10, 11, 12, 14, 15, 17, 18, 19, 20, 22, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 89, 92, 93, 95, 98, 99, 100, 101, 102, 103, 105, 106, 107, 108, 111, 112, 113, 116, 117, 118, 119], "tupl": [2, 4, 9, 11, 12, 13, 14, 16, 19, 21, 23, 24, 98, 100, 101, 108, 111, 116, 117, 119], "minimum": [2, 11, 96], "maximum": [2, 8, 11, 14, 18, 21, 73, 74, 90, 92, 96, 103, 117], "possibl": [2, 10, 11, 12, 21, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 90, 92, 93, 94, 95, 99, 101, 103, 104, 107, 108, 109, 112, 113, 114, 116, 117], "over": [2, 13, 18, 20, 27, 33, 56, 66, 71, 99, 101, 111, 113, 116], "default": [2, 8, 9, 10, 11, 14, 15, 16, 18, 19, 21, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 89, 92, 96, 98, 99, 100, 101, 105, 106, 107, 108, 117, 118], "rang": [2, 13, 14, 16, 17, 18, 20, 21, 22, 23, 24, 56, 88, 91, 92, 93, 94, 95, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 112, 113, 114, 115, 116, 117, 119], "set": [2, 10, 11, 15, 16, 17, 18, 19, 23, 24, 25, 26, 27, 28, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 82, 83, 84, 85, 87, 90, 91, 92, 94, 95, 97, 98, 99, 100, 101, 105, 106, 107, 108, 109, 113, 116, 117, 118, 119], "infti": [2, 11], "spec": [2, 15, 16, 18], "metadata": [2, 14, 16, 18, 24, 117], "fp": [2, 14, 24, 117], "np_random": [2, 14, 16, 18, 23, 117], "random": [2, 9, 10, 11, 14, 18, 19, 21, 24, 89, 90, 92, 93, 94, 95, 96, 98, 99, 100, 101, 106, 107, 108, 109, 113, 114, 116, 117, 119], "number": [2, 3, 8, 9, 10, 11, 12, 13, 14, 15, 16, 18, 19, 21, 22, 24, 26, 27, 28, 29, 30, 31, 32, 35, 36, 37, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 58, 61, 63, 64, 65, 67, 68, 70, 73, 75, 77, 78, 80, 81, 82, 84, 85, 89, 90, 92, 100, 101, 102, 107, 108, 109, 111, 113, 117, 119], "assign": [2, 75, 93, 94, 95, 105, 106], "dure": [2, 10, 11, 15, 16, 18, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 92, 98, 99, 100, 101, 107, 108, 114, 117], "super": [2, 16, 17, 19, 20, 23, 117, 119], "seed": [2, 8, 9, 10, 11, 15, 16, 21, 72, 115, 117, 119], "assess": 2, "self": [2, 4, 9, 10, 16, 17, 18, 19, 20, 95, 109, 116, 117, 119], "modifi": [2, 7, 9, 15, 16, 17, 19, 20, 23, 92, 105, 106, 114, 117], "extend": 2, "wrapper": [2, 8, 10, 11, 14, 15, 21, 22, 23, 105, 106, 109, 113, 114, 115, 116, 119], "acttyp": [2, 4, 14, 16, 17, 19, 20], "obstyp": [2, 4, 14, 16, 17, 19, 20, 23, 119], "supportsfloat": [2, 8, 11, 16, 20, 23, 119], "bool": [2, 8, 9, 11, 14, 15, 16, 18, 19, 23, 24, 90, 98, 99, 100, 101, 107, 108, 116, 117, 119], "dict": [2, 4, 8, 9, 11, 12, 13, 14, 15, 16, 18, 19, 21, 23, 112, 113, 114, 117, 119], "str": [2, 4, 8, 9, 10, 11, 12, 14, 15, 16, 18, 19, 23, 24, 98, 99, 100, 101, 107, 108, 116, 119], "ani": [2, 4, 7, 8, 9, 10, 11, 12, 13, 14, 16, 18, 19, 23, 24, 46, 50, 51, 52, 53, 54, 55, 73, 90, 93, 98, 100, 101, 102, 103, 104, 105, 106, 107, 108, 113, 116, 117, 118, 119], "one": [2, 10, 11, 12, 14, 15, 16, 18, 19, 21, 22, 23, 26, 27, 28, 32, 37, 44, 47, 48, 60, 69, 70, 71, 73, 74, 79, 92, 93, 94, 95, 96, 98, 100, 102, 103, 104, 106, 107, 111, 114, 116, 118, 119], "timestep": [2, 18, 19, 21, 94, 95, 98, 100, 101, 102, 103, 104, 105, 106, 108, 117, 119], "end": [2, 4, 16, 18, 21, 32, 41, 42, 44, 46, 48, 49, 57, 58, 59, 69, 73, 76, 77, 88, 96, 116, 118, 119], "reach": [2, 16, 32, 34, 44, 47, 48, 65, 68, 76, 77, 91, 92, 93, 94, 95, 98, 100, 101, 102, 103, 104, 105, 106, 108, 112, 113, 114, 116, 117, 118, 119], "necessari": [2, 9, 24, 50, 51, 52, 53, 54], "version": [2, 3, 8, 9, 16, 93, 116, 117, 118], "0": [2, 7, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 89, 90, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 112, 113, 114, 116, 117, 118, 119], "26": [2, 22, 98, 101, 102, 117, 118, 119], "wa": [2, 14, 15, 16, 19, 20, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 98, 99, 100, 101, 107, 108, 118, 119], "remov": [2, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 92, 114], "done": [2, 8, 14, 16, 18, 21, 22, 23, 98, 100, 101, 102, 103, 104, 108, 116, 117, 118, 119], "favor": 2, "clearer": 2, "had": 2, "critic": [2, 18], "bootstrap": [2, 23, 118], "algorithm": [2, 9, 97, 110, 114, 116, 118, 119], "paramet": [2, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 23, 90, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 107, 108, 117, 119], "provid": [2, 3, 7, 9, 10, 11, 14, 15, 16, 17, 18, 19, 21, 22, 24, 30, 44, 46, 50, 51, 52, 53, 54, 88, 92, 109, 117], "element": [2, 9, 10, 11, 13, 15, 19, 21, 93, 94, 95, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 117], "numpi": [2, 3, 4, 9, 11, 13, 15, 16, 17, 19, 23, 109, 116, 117, 119], "arrai": [2, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 90, 109, 116, 117, 119], "posit": [2, 10, 11, 12, 13, 14, 18, 19, 21, 24, 35, 56, 88, 89, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 112, 113, 114, 116, 117], "veloc": [2, 10, 12, 13, 88, 90, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108], "pole": [2, 75, 91, 103, 104, 109, 119], "cartpol": [2, 7, 8, 14, 15, 18, 19, 20, 21, 91, 93, 103, 104, 109, 119], "result": [2, 3, 12, 14, 15, 21, 92, 98, 101, 102, 110, 112, 114, 116], "whether": [2, 4, 8, 11, 14, 18, 23, 37, 90, 98, 99, 100, 101, 107, 108, 111, 116, 117, 118, 119], "defin": [2, 4, 9, 12, 16, 17, 18, 19, 20, 21, 96, 101, 117, 118], "under": [2, 19, 20, 116, 119], "mdp": [2, 18, 21, 94, 95], "task": [2, 10, 16, 19, 21, 60, 66, 69, 89, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 114, 117, 118, 119], "neg": [2, 11, 14, 21, 75, 95, 98, 99, 101, 102, 103, 105, 106, 114, 119], "goal": [2, 27, 30, 35, 37, 39, 41, 44, 56, 61, 62, 63, 64, 65, 67, 70, 72, 74, 75, 81, 82, 83, 84, 85, 86, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 111, 112, 113, 114, 117, 119], "move": [2, 3, 16, 20, 21, 23, 26, 29, 30, 39, 40, 54, 57, 68, 71, 74, 75, 88, 90, 93, 98, 99, 100, 102, 103, 104, 105, 106, 107, 108, 109, 112, 113, 114, 117, 118, 119], "lava": [2, 21, 55], "sutton": [2, 92, 93, 103, 104, 111, 112, 116], "barton": 2, "gridworld": [2, 109, 112, 117], "true": [2, 8, 12, 14, 15, 17, 18, 19, 21, 22, 24, 50, 51, 52, 53, 54, 88, 89, 90, 98, 99, 100, 101, 107, 108, 111, 113, 116, 117, 119], "condit": [2, 116, 118, 119], "outsid": [2, 89, 90, 118], "scope": [2, 118], "satisfi": 2, "typic": [2, 14, 114], "timelimit": [2, 8, 16, 18, 21, 117, 118], "could": [2, 14, 19, 20, 21, 24, 116, 117, 118, 119], "also": [2, 8, 11, 14, 15, 16, 18, 19, 21, 24, 36, 57, 58, 69, 70, 72, 88, 89, 90, 91, 97, 98, 99, 100, 101, 107, 108, 109, 116, 117, 118, 119], "indic": [2, 14, 18, 23, 89, 92, 93, 98, 101, 102, 111, 112, 113, 114, 116, 118, 119], "physic": [2, 87, 97, 103, 104, 119], "go": [2, 48, 75, 79, 89, 111, 116, 118, 119], "out": [2, 4, 13, 24, 33, 38, 55, 58, 66, 71, 76, 117, 118, 119], "bound": [2, 7, 11, 16, 17, 21, 23, 90, 92, 93, 94, 95, 96, 118], "prematur": 2, "auxiliari": [2, 117], "diagnost": 2, "log": [2, 119], "might": [2, 9, 11, 12, 16, 17, 18, 19, 20, 23, 116, 117, 119], "instanc": [2, 4, 8, 9, 10, 12, 13, 14, 15, 16, 18, 20, 21, 109], "describ": [2, 10, 21, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 92, 93, 107, 111], "perform": [2, 3, 14, 18, 21, 22, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 106, 109, 119], "variabl": [2, 9, 11, 15, 18, 100, 107, 108, 109, 116, 117, 118, 119], "hidden": [2, 97, 119], "individu": [2, 3, 16, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 117, 119], "term": [2, 16, 91, 92, 97, 98, 99, 100, 101, 105, 106, 107, 108, 117], "combin": [2, 9, 14, 16, 21, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 55, 56, 57, 58, 59, 60, 61, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 106], "produc": [2, 16, 18, 102, 117], "total": [2, 44, 88, 89, 90, 98, 99, 100, 101, 102, 103, 105, 106, 107, 108, 114, 119], "In": [2, 3, 11, 14, 15, 16, 17, 19, 21, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 89, 91, 92, 98, 99, 100, 101, 107, 108, 114, 116, 117, 118, 119], "openai": [2, 8, 15, 16, 21, 23, 87, 115, 116, 118, 119], "gym": [2, 7, 8, 9, 10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 23, 87, 88, 89, 90, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 112, 113, 114, 115, 116, 117, 118, 119], "v26": [2, 119], "distinguish": [2, 117, 118], "howev": [2, 3, 8, 9, 10, 11, 12, 15, 16, 17, 18, 19, 21, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 92, 98, 99, 100, 101, 105, 106, 116, 117, 118], "deprec": 2, "favour": [2, 22, 23], "boolean": [2, 9, 14, 18, 23, 90, 116, 119], "valu": [2, 8, 9, 10, 11, 12, 13, 14, 16, 17, 18, 19, 21, 23, 24, 74, 88, 90, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 112, 113, 114, 116, 118, 119], "case": [2, 4, 9, 10, 11, 16, 17, 19, 21, 23, 57, 69, 89, 98, 99, 100, 101, 107, 108, 114, 117, 118, 119], "further": [2, 23, 74, 90, 105, 106, 119], "undefin": 2, "signal": [2, 16, 18, 21, 98, 100, 101, 108, 114, 117, 118], "mai": [2, 11, 12, 14, 15, 17, 18, 19, 21, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 98, 99, 100, 101, 107, 108, 113, 117], "emit": [2, 16, 18], "differ": [2, 9, 10, 14, 15, 16, 17, 18, 19, 21, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 89, 96, 98, 99, 100, 101, 102, 103, 104, 108, 109, 117, 118], "reason": [2, 23, 90], "mayb": 2, "underli": [2, 16, 18, 21, 92], "solv": [2, 88, 91, 93, 97, 103, 104, 117, 119], "successfulli": [2, 114], "certain": [2, 47, 49, 103, 104, 106, 116], "exceed": [2, 16, 18, 21, 98, 100, 101, 108, 116], "simul": [2, 24, 50, 51, 52, 53, 54, 97, 101, 102, 103, 104, 116, 119], "enter": [2, 14, 31, 33, 60, 90, 112], "invalid": [2, 11, 116], "int": [2, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 24, 111, 112, 113, 114, 116, 117, 119], "none": [2, 4, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 18, 19, 23, 113, 116, 117], "option": [2, 4, 7, 8, 9, 10, 11, 14, 15, 16, 18, 19, 21, 23, 89, 92, 93, 94, 95, 96, 117], "intern": [2, 4, 15, 19], "new": [2, 3, 9, 16, 17, 18, 19, 21, 22, 23, 28, 31, 33, 46, 92, 93, 94, 95, 96, 106, 109, 114, 116, 117, 118], "often": [2, 9, 97, 117], "some": [2, 9, 10, 11, 15, 16, 18, 19, 20, 21, 23, 24, 40, 48, 66, 89, 91, 92, 97, 106, 107, 114, 116, 117], "explor": [2, 9, 54, 109, 116], "generalis": 2, "polici": [2, 19, 20, 21, 23, 91, 97, 98, 99, 100, 101, 102, 107, 108, 109, 115, 118], "control": [2, 9, 11, 20, 21, 23, 24, 26, 29, 31, 32, 33, 34, 35, 40, 42, 45, 52, 53, 54, 57, 59, 66, 67, 69, 71, 72, 73, 74, 75, 76, 79, 80, 87, 89, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108], "alreadi": [2, 3, 16, 19, 21], "rng": [2, 4, 9, 10, 11, 117], "therefor": [2, 3, 9, 15, 23], "right": [2, 11, 24, 26, 28, 29, 30, 31, 35, 39, 40, 44, 46, 47, 48, 49, 50, 51, 52, 53, 54, 56, 57, 58, 59, 61, 63, 64, 65, 67, 70, 75, 77, 78, 80, 81, 84, 85, 88, 89, 90, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 107, 108, 112, 113, 114, 116, 117, 119], "after": [2, 4, 8, 14, 15, 18, 19, 21, 32, 36, 41, 47, 51, 55, 77, 90, 98, 99, 100, 101, 102, 107, 108, 111, 114, 116, 117, 118, 119], "never": 2, "again": [2, 90, 117], "custom": [2, 7, 9, 14, 15, 19, 21, 23, 24, 50, 51, 52, 53, 54, 107, 109, 113], "line": [2, 23, 47, 92, 114, 117], "correctli": [2, 19, 20, 117], "v0": [2, 3, 8, 15, 16, 18, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 89, 90, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 112, 113, 114, 117, 118, 119], "25": [2, 12, 24, 50, 51, 52, 53, 54, 98, 100, 101, 102, 108, 114], "return_info": 2, "now": [2, 23, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 116, 117, 118, 119], "expect": [2, 9, 10, 11, 15, 18, 21, 119], "prng": [2, 9, 10, 11], "doe": [2, 8, 10, 12, 14, 15, 16, 18, 22, 36, 52, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 117, 118], "pass": [2, 4, 7, 8, 9, 10, 11, 12, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 89, 90, 98, 99, 100, 101, 107, 108, 117], "chosen": [2, 11, 24], "sourc": [2, 97, 109, 116, 117, 118, 119], "entropi": 2, "timestamp": 2, "dev": [2, 119], "urandom": 2, "integ": [2, 10, 11, 12, 14, 18, 19, 23, 24, 117], "even": [2, 8, 25, 27, 33, 34, 36, 38, 41, 42, 45, 55, 56, 57, 59, 60, 62, 66, 69, 71, 72, 73, 74, 76, 79, 83, 86, 102, 116, 117], "exist": [2, 8, 9, 15, 16, 21], "usual": [2, 10, 11, 16, 18, 24, 50, 51, 52, 53, 54, 56, 100, 116, 117], "been": [2, 14, 18, 21, 23, 98, 101, 102, 109, 117, 118], "refer": [2, 14, 18, 21, 23, 117, 118], "minim": [2, 117, 118, 119], "abov": [2, 10, 11, 14, 22, 23, 24, 50, 51, 52, 53, 54, 92, 93, 96, 97, 119], "paradigm": 2, "specifi": [2, 9, 10, 11, 14, 16, 17, 18, 19, 20, 21, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 90, 91, 96, 100, 101, 105, 106, 108, 110, 113, 114, 117], "how": [2, 9, 14, 15, 21, 56, 58, 59, 102, 103, 105, 106, 116, 117, 118, 119], "depend": [2, 3, 10, 14, 19, 20, 24, 26, 27, 28, 29, 30, 31, 32, 35, 36, 37, 39, 40, 42, 44, 46, 47, 48, 49, 50, 51, 52, 53, 54, 58, 59, 61, 63, 64, 65, 67, 68, 70, 75, 77, 78, 80, 81, 82, 84, 85, 87, 91, 93, 97, 98, 99, 100, 101, 107, 108, 109, 113], "specif": [2, 8, 11, 18, 118, 119], "analog": [2, 24], "dictionari": [2, 9, 10, 14, 15, 16, 18, 19, 21, 116, 117, 119], "complement": 2, "It": [2, 8, 10, 11, 14, 15, 16, 18, 21, 24, 25, 26, 27, 28, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 55, 56, 57, 58, 59, 60, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 82, 83, 84, 85, 88, 97, 98, 99, 100, 101, 102, 105, 106, 107, 108, 109, 116, 117, 119], "renderfram": [2, 14], "list": [2, 8, 9, 10, 11, 14, 15, 16, 19, 21, 24, 116], "comput": [2, 14, 67, 79, 98, 103, 105, 106, 109, 116, 117], "frame": [2, 14, 18, 19, 24, 37, 89, 90, 102, 105], "render_mod": [2, 14, 15, 16, 18, 19, 21, 23, 24, 115, 117], "wai": [2, 10, 16, 21, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 116, 118], "most": [2, 9, 16, 18, 19, 21, 23, 24, 50, 51, 52, 53, 54, 106, 116, 117], "achiev": [2, 24, 27, 92, 111], "appli": [2, 7, 8, 10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 88, 90, 91, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 116, 117, 119], "collect": [2, 3, 15, 27, 30, 48, 62, 63, 66, 82, 109, 116], "As": [2, 3, 15, 16, 21, 80, 92, 97, 98, 99, 101, 102, 110, 112, 114, 119], "known": [2, 18, 31], "__init__": [2, 10, 13, 16, 17, 19, 20, 116, 117, 119], "initialis": [2, 18, 23, 111], "By": [2, 8, 18, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 92, 98, 99, 100, 101, 107, 108], "continu": [2, 9, 16, 17, 21, 29, 30, 89, 90, 91, 94, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 116, 118, 119], "current": [2, 3, 11, 14, 16, 18, 19, 24, 89, 92, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 112, 113, 116, 117, 119], "displai": [2, 8, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 93, 117], "consumpt": 2, "occur": [2, 18, 92, 93, 117], "repres": [2, 10, 11, 14, 21, 23, 90, 92, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 112, 113, 114, 115, 117, 119], "np": [2, 7, 9, 10, 11, 13, 14, 15, 17, 18, 19, 20, 90, 114, 116, 117, 119], "ndarrai": [2, 4, 7, 8, 10, 11, 12, 13, 14, 17, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 114, 119], "shape": [2, 9, 10, 11, 12, 13, 16, 17, 18, 19, 21, 88, 89, 90, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 112, 113, 114, 117, 119], "x": [2, 9, 12, 90, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 105, 106, 107, 108, 109, 112, 117, 119], "y": [2, 24, 90, 96, 98, 99, 101, 102, 103, 105, 106, 107, 114, 119], "3": [2, 7, 8, 10, 11, 12, 13, 14, 15, 18, 19, 22, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 89, 90, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 112, 113, 114, 116, 117, 119], "rgb": [2, 16, 18, 19, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 89, 98, 99, 100, 101, 102, 103, 104, 107, 108], "pixel": [2, 16, 89, 109, 117], "imag": [2, 9, 15, 16, 18, 19, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 89], "string": [2, 8, 9, 11, 14, 19], "stringio": 2, "style": [2, 15, 18, 109, 119], "represent": [2, 21, 118], "each": [2, 3, 8, 9, 10, 11, 14, 15, 16, 17, 19, 21, 24, 44, 46, 47, 48, 49, 52, 60, 67, 69, 70, 71, 72, 73, 74, 75, 87, 88, 90, 91, 92, 93, 94, 95, 98, 101, 102, 103, 104, 105, 109, 110, 112, 114, 116, 117], "includ": [2, 8, 19, 21, 22, 23, 24, 93, 98, 99, 100, 101, 103, 104, 105, 106, 107, 108, 109, 114, 117, 118], "newlin": 2, "escap": [2, 43, 58, 62], "sequenc": [2, 8, 9, 11, 12, 15, 19, 21, 24, 109], "color": [2, 10, 28, 39, 52, 70, 114], "rgb_array_list": [2, 14, 16, 18], "ansi_list": 2, "base": [2, 3, 4, 9, 10, 15, 16, 17, 18, 19, 20, 21, 48, 57, 74, 87, 92, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 114, 116, 117, 119], "except": [2, 71, 74, 117], "rendercollect": [2, 3, 16, 18], "pop": [2, 106], "kei": [2, 8, 9, 10, 11, 14, 15, 16, 18, 19, 21, 24, 25, 56, 98, 99, 100, 101, 105, 106, 107, 108, 112, 113, 114, 116, 117, 118], "support": [2, 3, 9, 10, 12, 14, 15, 16, 18, 19, 21, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 92, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 117], "longer": [2, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 98, 100, 101, 102, 103, 104, 105, 106, 108, 109, 119], "accept": [2, 14, 18, 24, 117], "rather": [2, 23, 89, 109, 116], "v1": [2, 7, 8, 14, 15, 18, 19, 20, 21, 88, 89, 90, 92, 93, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 113, 114, 116], "type": [2, 9, 10, 11, 15, 16, 17, 19, 21, 23, 46, 89, 98, 99, 100, 101, 107, 108, 109, 117, 119], "discret": [2, 9, 10, 12, 13, 15, 17, 19, 21, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 89, 90, 92, 93, 94, 95, 110, 111, 112, 113, 114, 116, 117], "give": [2, 27, 28, 46, 47, 90, 105, 111, 114, 116, 119], "2": [2, 7, 10, 11, 12, 13, 14, 15, 17, 19, 20, 24, 25, 26, 28, 29, 30, 31, 32, 34, 35, 37, 39, 40, 42, 44, 46, 47, 48, 49, 50, 51, 52, 53, 54, 56, 58, 61, 63, 64, 65, 67, 68, 70, 75, 77, 78, 79, 80, 81, 82, 84, 85, 89, 90, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 111, 112, 113, 114, 116, 117, 119], "mean": [2, 21, 23, 92, 98, 99, 100, 105, 117, 119], "two": [2, 10, 11, 14, 15, 18, 23, 24, 26, 37, 79, 88, 90, 92, 94, 95, 97, 98, 99, 100, 101, 102, 103, 105, 106, 107, 108, 111, 116, 117], "1": [2, 7, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 89, 90, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 112, 113, 114, 116, 117, 118, 119], "box": [2, 9, 10, 12, 13, 15, 16, 17, 19, 21, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 89, 90, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 117], "4028234663852886e": 2, "38": [2, 101, 102], "4": [2, 11, 12, 14, 15, 16, 17, 18, 19, 21, 24, 26, 28, 29, 30, 31, 33, 35, 37, 39, 40, 44, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 58, 61, 63, 64, 65, 67, 68, 69, 70, 77, 78, 80, 81, 82, 84, 85, 88, 89, 90, 92, 93, 94, 95, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 112, 113, 114, 116, 117, 119], "float32": [2, 10, 11, 12, 13, 15, 16, 17, 19, 21, 88, 89, 90, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108], "denot": [2, 93], "well": [2, 9, 31, 74, 92, 98, 101, 102, 109, 117], "high": [2, 3, 10, 11, 12, 13, 15, 19, 21, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 89, 90, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109], "8000002e": 2, "00": 2, "4028235e": 2, "1887903e": 2, "01": [2, 20, 90, 98, 99, 102, 103, 104, 105, 106, 107, 116], "dtype": [2, 9, 10, 11, 12, 13, 15, 19, 90, 117], "low": [2, 10, 11, 12, 13, 19, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 89, 90, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109], "etc": [2, 9, 16, 69, 72, 76, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 117, 118], "determin": [2, 11, 24, 90, 92, 93, 94, 95, 96, 109, 113, 117, 118], "inf": [2, 19, 93, 95, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108], "envspec": [2, 8, 16], "normal": [2, 11, 16, 18, 88, 89, 96, 98, 99, 103, 119], "finish": [2, 89, 90], "code": [2, 4, 9, 10, 14, 15, 16, 18, 19, 20, 92, 109, 116, 117, 119], "clean": 2, "up": [2, 10, 11, 15, 19, 24, 25, 27, 28, 29, 30, 31, 33, 34, 35, 37, 40, 43, 44, 46, 47, 48, 49, 50, 51, 52, 53, 54, 57, 58, 61, 63, 68, 70, 71, 72, 74, 75, 78, 79, 80, 81, 84, 85, 88, 90, 97, 98, 101, 102, 106, 111, 112, 113, 114, 116, 117], "window": [2, 14, 44, 89, 117], "http": [2, 14, 16, 24, 89, 92, 111, 112, 113, 116, 117, 119], "connect": [2, 10, 92, 98, 99, 100, 106, 107, 108], "properti": [2, 9, 16, 118], "unwrap": [2, 16, 21, 92], "non": [2, 9, 12, 14, 113, 117, 118, 119], "wrap": [2, 7, 8, 14, 15, 16, 18, 19, 20, 21, 117, 119], "_np_random": 2, "meth": 2, "much": [2, 24, 50, 51, 52, 53, 54, 58, 59, 102, 117, 118], "creat": [2, 8, 11, 13, 14, 15, 18, 21, 34, 88, 89, 90, 105, 106, 116, 119], "creation": [2, 15, 117], "tutori": [2, 21, 23, 116, 119], "gymnasium": [3, 7, 8, 9, 10, 11, 12, 13, 14, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 111, 112, 113, 114, 116, 118, 119], "env": [3, 4, 7, 8, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 89, 90, 92, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 112, 113, 114, 115, 116, 118, 119], "flexibl": [3, 15, 109], "implement": [3, 9, 10, 15, 17, 18, 19, 20, 21, 22, 23, 24, 96, 103, 109, 110, 114, 117, 119], "complic": [3, 11, 16], "parallel": [3, 15], "propos": [3, 109], "funcenv": 3, "part": [3, 18, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 89, 90, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 112, 113, 114, 118], "its": [3, 14, 15, 17, 18, 39, 46, 69, 81, 86, 90, 96, 97, 107, 109, 119], "own": [3, 15, 23, 39, 74], "relat": [3, 119], "larg": [3, 15, 16, 23, 95, 98, 99, 100, 101, 102, 105, 106, 107, 108, 109], "believ": 3, "improv": [3, 15], "arbitrarili": 3, "complex": [3, 9, 10, 101, 102, 103, 104, 119], "rl": [3, 14, 18, 115, 116, 118, 119], "advanc": [3, 15, 92], "becom": [3, 73, 87, 118], "were": [3, 19, 23, 41, 87, 92, 117], "mind": 3, "jax": [3, 109], "pytorch": [3, 119], "data": [3, 9, 12, 14, 16, 23, 116, 117, 119], "With": [3, 112, 116], "hardwar": 3, "acceler": [3, 89, 94, 95, 96], "brax": [3, 109], "written": [3, 14, 16, 23], "similar": [3, 10, 23, 28, 39, 105, 117], "program": [3, 15], "game": [3, 11, 14, 18, 21, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 63, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 87, 111, 112, 113, 116, 117], "town": 3, "anymor": 3, "upgrad": 3, "jumpi": 3, "torch": [3, 119], "project": [3, 21, 23, 109, 116], "like": [3, 4, 9, 11, 14, 16, 17, 18, 19, 20, 21, 26, 27, 28, 29, 30, 31, 32, 33, 35, 37, 39, 40, 44, 46, 47, 48, 49, 58, 61, 63, 64, 65, 66, 67, 68, 69, 70, 75, 77, 78, 80, 81, 82, 84, 85, 88, 90, 98, 99, 101, 102, 104, 105, 106, 108, 114, 117], "supersuit": 3, "aim": [3, 56, 100, 103, 107, 108, 119], "bring": 3, "detail": [3, 9, 14, 18, 21, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 92, 109, 117], "caus": [3, 18, 21, 57, 114], "ad": [3, 16, 18, 19, 21, 23, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 52, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 90, 95, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 114, 117], "v28": 3, "rewrit": 3, "vectorenv": [3, 9], "inherit": [3, 9, 16, 17, 19, 20, 21, 117], "vectoris": [3, 9, 109], "old": [3, 15, 16, 18, 22, 115], "tree": [3, 75], "structur": [3, 4, 9, 10, 12, 117], "transformobserv": [3, 16, 19], "lambdaobservationv0": [3, 7], "vectorlambdaobserv": 3, "No": [3, 18, 92, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 119], "filterobserv": [3, 16, 19], "vectorfilterobserv": 3, "ye": 3, "flattenobserv": [3, 10, 16, 19, 117], "vectorflattenobserv": 3, "grayscaleobserv": [3, 16, 19], "vectorgrayscaleobserv": 3, "pixelobservationwrapp": [3, 16, 19], "pixelobserv": 3, "vectorpixelobserv": 3, "resizeobserv": [3, 16, 19], "vectorresizeobserv": 3, "Not": [3, 18], "reshapeobserv": 3, "vectorreshapeobserv": 3, "rescaleobserv": 3, "vectorrescaleobserv": 3, "dtypeobserv": 3, "vectordtypeobserv": 3, "normalizeobserv": [3, 16, 19], "vectornormalizeobserv": 3, "timeawareobserv": [3, 16, 19, 21], "vectortimeawareobserv": 3, "framestack": [3, 16, 18], "framestackobserv": 3, "vectorframestackobserv": 3, "delayobserv": 3, "vectordelayobserv": 3, "ataripreprocess": [3, 16, 18], "lambdaactionv0": [3, 7], "vectorlambdaact": 3, "clipact": [3, 16, 17, 21], "vectorclipact": 3, "rescaleact": [3, 16, 17, 21], "vectorrescaleact": 3, "nanact": 3, "vectornanact": 3, "stickyact": 3, "vectorstickyact": 3, "transformreward": [3, 16, 20], "lambdarewardv0": [3, 7], "vectorlambdareward": 3, "cliprewardv0": [3, 7], "vectorclipreward": 3, "rescalereward": 3, "vectorrescalereward": 3, "normalizereward": [3, 16, 20], "vectornormalizereward": 3, "autoresetwrapp": [3, 8, 16, 18, 117], "autoreset": [3, 8, 15, 117], "vectorautoreset": 3, "passiveenvcheck": [3, 18, 21], "vectorpassiveenvcheck": 3, "orderenforc": [3, 16, 18, 21, 117], "vectororderenforc": 3, "envcompat": [3, 16, 18, 22, 23], "shimmi": 3, "recordepisodestatist": [3, 16, 18, 23, 116, 119], "vectorrecordepisodestatist": 3, "vectorrendercollect": 3, "humanrend": [3, 16, 18], "jaxtonumpi": 3, "vectorjaxtonumpi": 3, "jaxtotorch": 3, "vectorjaxtotorch": 3, "vectorlistinfo": [3, 15, 16, 18], "These": [3, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 97, 98, 101, 107, 116, 119], "28": [3, 24, 33, 39, 92, 101, 102], "templat": 4, "meant": 4, "stateless": 4, "manner": [4, 11, 16, 19, 56], "being": [4, 8, 12, 18, 45, 94, 95, 96, 98, 101, 102, 106, 116], "around": [4, 18, 34, 87, 106, 109], "explicitli": [4, 117, 118], "That": [4, 93], "said": [4, 98, 100, 101, 108], "noth": [4, 89, 90, 119], "here": [4, 14, 92, 117], "prevent": [4, 11, 15, 47, 109], "statefulli": 4, "just": [4, 16, 21, 50, 56, 73, 104, 106], "recommend": [4, 8, 15, 18, 23, 24, 50, 51, 52, 53, 54, 90, 98, 101, 102, 116, 117], "consist": [4, 11, 16, 19, 21, 24, 37, 88, 92, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 111, 116, 117, 119], "method": [4, 10, 14, 17, 18, 19, 20, 22, 117, 119], "pomdp": 4, "given": [4, 8, 11, 16, 19, 71, 74, 88, 90, 91, 92, 94, 95, 98, 100, 101, 108, 116, 118], "transit": [4, 14, 21, 24, 50, 51, 52, 53, 54, 101, 102, 112, 113, 114, 118], "next_stat": [4, 116], "state_info": 4, "step_info": 4, "serv": [4, 9, 98, 99, 100, 101, 107, 108, 119], "purpos": [4, 9, 119], "allow": [4, 7, 8, 9, 10, 14, 16, 21, 22, 23, 24, 55, 73, 92, 93, 94, 95, 96, 103, 104, 105, 106, 109, 117, 119], "constant": [4, 35, 74, 90, 95, 98, 100, 101, 108], "them": [4, 9, 16, 18, 22, 23, 24, 26, 27, 28, 31, 32, 36, 40, 47, 68, 77, 90, 99, 106, 114], "itself": [4, 12, 15, 16, 18, 21, 22], "moment": [4, 74], "predominantli": 4, "futur": [4, 80, 109], "intend": [4, 18, 113], "flesh": 4, "offici": 4, "expos": 4, "statetyp": 4, "rewardtyp": 4, "terminaltyp": 4, "full": [4, 21, 24, 50, 51, 52, 53, 54, 89, 90, 116], "transform": [4, 9, 12, 14, 16, 17, 18, 106], "func": [4, 7, 12], "callabl": [4, 7, 8, 13, 14, 15, 18, 19, 20], "render_imag": 4, "render_st": 4, "renderstatetyp": 4, "show": [4, 19, 23, 24, 34, 40, 111, 116, 119], "render_init": 4, "kwarg": [4, 8, 14, 15, 22, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 117], "render_clos": 4, "autoclass": 4, "gymasnium": 4, "experiment": [7, 92], "argtyp": 7, "constructor": [7, 8, 9, 10, 11, 14, 16, 17, 19, 20, 21, 117], "environ": [7, 9, 11, 13, 16, 17, 19, 20, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 110, 111, 112, 113, 114, 118, 119], "lambdaact": 7, "_": [7, 13, 14, 15, 16, 21, 115], "rew": [7, 14, 118], "min_reward": [7, 20], "union": [7, 8, 10, 11, 12, 13, 14, 15, 17, 19], "float": [7, 8, 11, 12, 14, 16, 17, 19, 20, 24, 55, 68, 90, 98, 99, 100, 101, 107, 108, 116, 117, 119], "max_reward": [7, 20], "clip": [7, 16, 20, 21, 94, 95, 98, 101, 117], "between": [7, 10, 11, 18, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 90, 92, 93, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 116, 117, 118, 119], "upper": [7, 11, 21, 101, 102], "lower": [7, 11, 21, 98, 99, 100, 101, 102, 105, 106, 107, 108, 116], "5": [7, 10, 11, 12, 13, 17, 18, 24, 26, 28, 29, 30, 31, 34, 35, 37, 40, 44, 46, 47, 48, 49, 50, 51, 52, 53, 54, 58, 61, 63, 64, 65, 67, 68, 70, 77, 78, 80, 81, 82, 84, 85, 88, 89, 90, 92, 94, 98, 99, 100, 101, 102, 103, 105, 106, 107, 108, 111, 114, 116, 117, 119], "cliprewardsv0": 7, "higher": [7, 88], "load": 8, "pre": [8, 113], "sever": [8, 11, 16, 18, 21, 23, 24, 54, 109], "id": [8, 15, 113, 117], "liter": 8, "mountaincar": [8, 94], "mountaincarcontinu": [8, 95], "pendulum": [8, 15, 19, 21, 91, 92, 93, 97, 119], "acrobot": [8, 91], "lunarland": [8, 18, 21, 23, 90, 115], "v2": [8, 17, 18, 21, 23, 88, 89, 90, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 114, 115], "lunarlandercontinu": [8, 17], "bipedalwalk": [8, 16, 17, 21, 88], "v3": [8, 16, 17, 21, 88, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 114], "bipedalwalkerhardcor": 8, "carrac": [8, 14, 19, 89], "blackjack": [8, 21, 110], "frozenlak": [8, 14, 113], "frozenlake8x8": 8, "cliffwalk": [8, 112], "taxi": [8, 110], "reacher": [8, 16, 97, 105], "v4": [8, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 119], "pusher": [8, 97], "invertedpendulum": [8, 97, 103, 104, 119], "inverteddoublependulum": [8, 103], "halfcheetah": [8, 97, 99], "hopper": [8, 97, 108], "swimmer": [8, 97], "walker2d": [8, 97], "ant": [8, 97, 100, 108], "humanoidstandup": [8, 97, 102], "humanoid": [8, 45, 97, 98], "accord": [8, 10, 11, 15, 90], "find": [8, 24, 25, 50, 51, 52, 53, 54, 60, 69, 81, 103, 106, 117], "avail": [8, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 90, 109, 111, 112, 117], "modul": [8, 13, 117, 119], "eg": [8, 14, 117], "max_episode_step": [8, 18, 117], "length": [8, 10, 11, 14, 16, 18, 19, 88, 92, 93, 94, 95, 99, 107, 109, 113, 114, 116], "apply_api_compat": [8, 18, 22], "stepapicompat": [8, 16, 18, 22], "argument": [8, 9, 10, 11, 12, 14, 15, 19, 21, 22, 87, 91, 110, 116, 117], "fals": [8, 14, 15, 18, 19, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 89, 90, 98, 99, 100, 101, 107, 108, 111, 116, 117, 119], "disable_env_check": [8, 15], "checker": [8, 15], "addit": [8, 9, 15, 16, 18, 21, 23, 24, 30, 41, 71, 75, 90, 91, 92, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 111, 114, 116, 117, 119], "rais": [8, 11, 12, 13, 14, 15, 18, 19, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108], "error": [8, 11, 12, 14, 16, 18, 116, 118], "entry_point": [8, 117], "reward_threshold": [8, 98, 99, 100, 101, 102, 105, 106, 107, 108, 117], "nondeterminist": [8, 117], "order_enforc": [8, 117], "syntax": 8, "namespac": [8, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 117], "env_nam": [8, 22], "v": [8, 73, 94, 103], "keyword": [8, 10, 15, 19, 21, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 111, 116, 117], "entri": 8, "point": [8, 12, 14, 16, 24, 27, 28, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 45, 46, 47, 48, 49, 51, 55, 56, 59, 66, 67, 68, 69, 70, 71, 72, 74, 76, 77, 78, 80, 81, 84, 88, 89, 90, 92, 93, 96, 106, 111, 118], "threshold": [8, 92, 93, 114, 117], "consid": [8, 19, 89, 90, 91, 97, 98, 100, 101, 108, 117], "learnt": 8, "knowledg": 8, "limit": [8, 21, 40, 48, 55, 56, 69, 74, 103, 104, 116, 119], "enabl": [8, 16, 24, 89, 109], "order": [8, 9, 10, 16, 21, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 97, 98, 99, 100, 101, 102, 103, 104, 105, 108, 109, 117], "enforc": 8, "correct": [8, 114, 117, 118], "disabl": [8, 18, 113], "pprint_registri": 8, "onli": [8, 9, 10, 11, 12, 15, 16, 17, 18, 19, 23, 24, 26, 28, 29, 30, 31, 32, 35, 37, 39, 40, 44, 46, 47, 48, 49, 50, 51, 52, 53, 54, 56, 58, 61, 63, 64, 65, 67, 68, 70, 71, 72, 73, 74, 75, 77, 78, 80, 81, 82, 84, 85, 94, 95, 98, 99, 100, 101, 103, 105, 106, 108, 109, 116, 117], "env_id": [8, 22], "retriev": [8, 18, 45, 48, 74], "global": 8, "_registri": 8, "num_col": 8, "exclude_namespac": 8, "disable_print": 8, "column": [8, 119], "arrang": 8, "exclud": [8, 98, 99, 100, 101, 107, 108], "instead": [8, 15, 19, 21, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 92, 108, 117], "consol": [8, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86], "npt": [9, 10, 11], "dtypelik": 9, "superclass": [9, 17, 19, 20], "crucial": 9, "thei": [9, 15, 18, 19, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 106, 110, 111, 112, 113, 117], "variou": [9, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 102, 109, 119], "clearli": 9, "interact": [9, 14, 24, 109, 116, 117], "look": [9, 14, 16, 18, 20, 21, 24, 26, 28, 29, 30, 31, 32, 35, 37, 39, 40, 44, 46, 47, 48, 49, 58, 61, 63, 64, 65, 67, 68, 70, 73, 75, 77, 78, 80, 81, 82, 84, 85, 117, 118], "u": [9, 16, 20, 24, 116, 117, 119], "work": [9, 14, 16, 18, 19, 24, 89, 90, 92, 99, 100, 103, 104, 108], "highli": [9, 23, 24, 87, 91, 109, 117], "form": [9, 10, 11, 18, 92, 107, 117], "painlessli": 9, "flat": [9, 10, 11, 12, 19], "sampl": [9, 10, 11, 12, 13, 14, 15, 19, 20, 21, 23, 90, 114, 115, 116, 117, 119], "especi": [9, 20, 117], "hierarch": [9, 114], "via": [9, 10, 16, 18, 19, 20, 21, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 91, 97, 109, 110, 117, 119], "build": [9, 16, 26, 44, 48, 103, 108], "express": [9, 14, 98, 101, 102], "cover": [9, 116], "parametr": [9, 119], "probabl": [9, 24, 112, 113, 114, 116, 118, 119], "distribut": [9, 10, 11, 107, 109, 113, 119], "batch": [9, 13, 15], "moreov": [9, 18, 24, 27, 37, 117], "handl": [9, 15, 103, 111, 116], "care": [9, 75], "immut": 9, "mask": [9, 10, 11, 23, 114], "t_cov": 9, "randomli": [9, 10, 90, 113, 117], "uniform": [9, 11, 12, 94, 95, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108], "bounded": 9, "int8": [9, 11], "member": [9, 58], "possibli": [9, 10, 11, 13, 16, 18, 21, 109], "subspac": [9, 10, 11, 12], "to_json": 9, "sample_n": 9, "jsonabl": 9, "from_json": 9, "matric": [9, 109], "multidiscret": [9, 10, 12, 13, 15, 21, 117], "binari": [9, 11, 21, 117], "hold": [9, 111, 116], "down": [9, 11, 24, 28, 30, 31, 37, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 57, 58, 61, 63, 65, 66, 68, 70, 78, 80, 81, 84, 85, 89, 102, 111, 112, 113, 114, 116, 117, 118], "button": [9, 11, 14, 21], "multibinari": [9, 10, 12, 13, 21], "multipl": [9, 10, 11, 13, 15], "ax": [9, 11, 116, 117], "messag": 9, "mission": [9, 57, 59, 60], "join": 9, "togeth": [9, 24, 97], "separ": [9, 10, 23, 117], "readabl": [9, 10], "fix": [9, 10, 11, 16, 18, 20, 21, 23, 57, 92, 93, 96, 97, 98, 99, 100, 101, 103, 104, 108, 111, 113, 117, 119], "unord": 9, "entiti": 9, "select": [9, 11, 47, 98, 101, 102, 105, 106], "graph": [9, 12, 21], "node": [9, 10, 12], "edg": [9, 10, 12, 93], "flatten": [9, 12, 16, 97, 116, 117], "unflatten": [9, 12], "neural": [9, 12, 92, 107, 109, 119], "network": [9, 12, 107], "flatdim": [9, 12], "dimens": [9, 11, 12, 19, 98, 99, 100, 101, 107, 108, 109, 119], "flatten_spac": [9, 12], "revers": [9, 12, 111, 119], "size": [9, 18, 113, 117], "batch_spac": [9, 13], "concaten": [9, 12, 13, 97], "iter": [9, 10, 13, 15], "create_empty_arrai": [9, 13], "create_shared_memori": [9, 13], "read_from_shared_memori": [9, 13], "write_to_shared_memori": [9, 13], "spaces_kwarg": 10, "constitu": 10, "usag": [10, 11, 12, 16, 89], "ordereddict": [10, 13, 19], "nest": [10, 13, 109], "ext_control": 10, "inner_st": 10, "charg": 10, "100": [10, 12, 18, 38, 48, 71, 72, 88, 89, 90, 92, 95, 100, 105, 112, 113], "system_check": 10, "10": [10, 11, 17, 24, 31, 37, 50, 51, 52, 53, 54, 61, 68, 71, 74, 88, 90, 96, 98, 99, 100, 101, 102, 103, 105, 106, 107, 108, 111, 112, 114, 116, 117, 119], "job_statu": 10, "progress": [10, 80], "conveni": [10, 16, 21, 117], "easili": [10, 16], "deal": 10, "instanti": [10, 14, 18, 19, 20, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 117], "either": [10, 11, 12, 14, 18, 21, 22, 24, 47, 57, 94, 95, 111, 113, 119], "avoid": [10, 13, 16, 21, 24, 27, 28, 30, 35, 36, 44, 46, 62, 63, 65, 70, 72, 73, 78, 112, 114], "independ": [10, 11, 15, 100, 106, 107, 108], "same": [10, 12, 14, 15, 19, 56, 88, 89, 92, 105, 106, 107, 114, 116, 118], "attr": 10, "warn": [10, 14, 15, 18], "guarante": [10, 24], "uniqu": [10, 87, 91, 97, 103], "sub": [10, 15, 74], "precis": 10, "cartesian": [10, 11, 96], "product": [10, 11], "03633198": 10, "42370757": 10, "involv": [10, 87, 103, 104, 109, 112, 113, 114, 117, 119], "reproduc": [10, 23], "draw": [10, 111, 116, 117], "42": [10, 11, 93, 101, 102, 115], "54": 10, "finit": [10, 11, 17, 98, 102, 103, 104, 105, 106, 108, 118, 119], "a_0": 10, "dot": [10, 11, 117], "a_n": 10, "a_i": 10, "belong": [10, 13], "n": [10, 11, 12, 13, 21, 24, 43, 89, 92, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 116, 119], "0259352": 10, "80977976": 10, "80066574": 10, "77165383": 10, "must": [10, 12, 13, 14, 15, 16, 17, 18, 19, 21, 23, 24, 25, 26, 29, 31, 32, 33, 34, 36, 40, 41, 42, 45, 48, 49, 58, 62, 64, 65, 70, 89, 100, 108, 117, 118], "length_mask": 10, "sample_mask": 10, "drawn": [10, 11, 105, 107, 111], "geometr": 10, "featur": [10, 11, 109], "feature_spac": 10, "node_spac": [10, 12], "edge_spac": [10, 12], "seri": [10, 21], "adjac": 10, "matrix": 10, "edge_link": [10, 12], "num_nod": 10, "num_edg": 10, "graphinst": [10, 12], "don": [10, 16, 23, 24, 40, 50, 51, 52, 53, 54, 74, 89, 94, 117, 118], "edge_mask": 10, "multipli": [10, 95], "attribut": [10, 21, 23, 105, 106, 117], "unbound": 11, "mathbb": 11, "interv": [11, 21, 98, 100, 101, 108], "There": [11, 16, 21, 56, 57, 69, 88, 90, 91, 94, 95, 97, 102, 103, 104, 105, 106, 109, 112, 114, 117], "common": [11, 16, 19, 21, 118, 119], "ident": [11, 15, 19], "construct": [11, 24, 50, 51, 52, 53, 54, 92, 98, 99, 100, 101, 107, 108], "scalar": [11, 17], "respect": [11, 15, 16, 18, 21, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 90, 92, 98, 101, 102, 107], "assum": [11, 19, 117], "across": [11, 13, 30, 40, 51, 52, 55], "infer": [11, 97], "essenti": 11, "valueerror": [11, 12, 13, 15, 18, 19], "coordin": [11, 16, 19, 88, 90, 96, 98, 99, 100, 101, 102, 103, 105, 106, 107, 108], "shift": [11, 21], "exponenti": [11, 16, 20], "unsupport": 11, "is_bound": 11, "both": [11, 15, 18, 19, 21, 22, 88, 91, 92, 106, 108, 109, 111, 112, 113, 114, 117, 118, 119], "sens": [11, 109], "One": [11, 21, 98, 101, 102], "neither": [11, 18, 111], "nor": [11, 18, 111, 112], "mani": [11, 18, 19, 21, 24, 30, 33, 37, 56, 59, 74, 84, 116, 117], "subset": [11, 17, 24, 50, 51, 52, 53, 54, 117], "smallest": 11, "maskndarrai": 11, "uniformli": [11, 24, 92, 93, 105, 106, 117], "infeas": 11, "sort": 11, "fair": 11, "coin": 11, "toss": 11, "per": [11, 15, 37, 56, 79, 114, 118], "nvec": 11, "int64": [11, 12], "keyboard": [11, 14], "alwai": [11, 12, 18, 24, 90, 94, 95, 98, 101, 102, 105, 107, 111, 112, 113, 114, 117], "noop": [11, 14, 18, 24, 26, 28, 29, 30, 31, 32, 35, 37, 39, 40, 44, 46, 47, 48, 49, 50, 51, 52, 53, 54, 58, 61, 63, 64, 65, 67, 68, 70, 75, 77, 78, 80, 81, 82, 84, 85, 114], "nintendo": 11, "conceptu": 11, "arrow": [11, 68], "left": [11, 24, 26, 28, 29, 30, 31, 35, 39, 40, 44, 46, 47, 48, 49, 50, 51, 52, 53, 54, 56, 57, 58, 61, 63, 64, 65, 67, 70, 74, 75, 77, 78, 80, 81, 84, 85, 88, 89, 90, 93, 94, 98, 101, 102, 103, 104, 108, 112, 113, 114, 116, 117, 119], "param": 11, "min": [11, 17, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111], "max": [11, 17, 18, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 113, 116, 119], "press": [11, 14, 21, 89, 92], "although": 11, "rare": 11, "d": [11, 14, 92, 105, 106], "categor": 11, "vector": [11, 14, 16, 88, 90, 102, 103, 104, 105, 106, 119], "count": [11, 88, 90, 111, 116], "kind": 11, "unless": [11, 16, 111, 112, 113, 114, 117], "max_length": 11, "min_length": 11, "charset": 11, "alphanumer": 11, "compris": 11, "charact": [11, 14, 58, 69], "b5": 11, "hello": 11, "0123456789": 11, "digit": [11, 109], "inclus": [11, 24], "empti": [11, 13, 18, 74, 116, 119], "english": 11, "alphabet": 11, "plu": [11, 40, 112], "latin": 11, "charlist": 11, "zero": [11, 13, 96, 99, 109, 116, 117, 118, 119], "matter": 11, "equival": [12, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86], "would": [12, 17, 19, 20, 98, 99, 100, 101, 102, 107, 108, 115, 117], "notimplementederror": 12, "cannot": [12, 13, 18, 21, 23, 112, 117, 118], "attempt": [12, 90, 102, 103, 114], "compound": 12, "oper": [12, 18], "boundari": 12, "while": [12, 23, 24, 27, 28, 44, 59, 62, 63, 64, 65, 68, 70, 72, 74, 78, 81, 83, 90, 92, 93, 96, 98, 99, 101, 102, 105, 106, 107, 111, 112, 116, 117, 118, 119], "exactli": [12, 107], "origin": [12, 15, 17, 18, 19, 23, 89, 92, 103, 105, 106], "effect": [12, 13, 16, 18, 19, 21, 24, 50, 51, 52, 53, 54, 90, 103, 104, 114, 116, 119], "necessarili": 12, "hot": 12, "encod": [12, 114, 117], "60": [12, 58, 71, 109], "recurs": 12, "6": [12, 24, 28, 29, 30, 31, 35, 44, 46, 47, 48, 49, 50, 51, 52, 53, 54, 58, 61, 63, 65, 79, 80, 81, 84, 85, 92, 94, 95, 98, 99, 100, 101, 102, 103, 105, 106, 107, 108, 112, 114, 119], "12": [12, 24, 31, 33, 37, 39, 50, 51, 52, 53, 54, 58, 61, 73, 90, 92, 93, 98, 99, 100, 101, 102, 105, 108, 111, 112, 116], "int32": 12, "15": [12, 13, 24, 47, 50, 51, 52, 53, 54, 58, 77, 90, 98, 99, 101, 102, 105, 108, 109, 113], "k": [12, 14, 18, 90, 107], "m": [12, 24, 43, 92, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 117], "match": [12, 15, 17, 79], "copi": [13, 15, 117], "item": [13, 14, 109, 116], "6348213": 13, "28607962": 13, "60760117": 13, "87383074": 13, "192658": 13, "2148103": 13, "99644893": 13, "08304597": 13, "7238421": 13, "35848552": 13, "1533453": 13, "67958736": 13, "49076623": 13, "38661423": 13, "7975036": 13, "93317133": 13, "stopiter": 13, "fn": 13, "multi_binari": 13, "built": [13, 23, 109], "multi_discret": 13, "ctx": 13, "mp": 13, "multiprocess": [13, 15], "opt": 13, "hostedtoolcach": 13, "9": [13, 15, 24, 28, 31, 36, 45, 50, 51, 52, 53, 54, 58, 61, 71, 80, 85, 92, 96, 98, 99, 100, 101, 102, 103, 105, 106, 108, 111, 116], "x64": 13, "lib": [13, 112], "python3": 13, "process": [13, 14, 15, 19, 21, 92, 105, 117, 118], "eventu": 13, "shared_memori": [13, 15], "customspaceerror": 13, "read": [13, 23, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 89, 90, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 112, 113, 114], "forward": [13, 35, 57, 88, 98, 99, 100, 101, 102, 107, 108, 119], "vice": [13, 18], "versa": [13, 18], "side": [13, 19, 26, 39, 54, 56, 90], "write": [13, 15, 117], "num_env": [13, 15], "plai": [14, 21, 34, 47, 60, 79, 84, 89, 109, 116, 117], "transpos": [14, 117], "zoom": 14, "callback": 14, "keys_to_act": 14, "w": [14, 98, 101, 102], "7": [14, 24, 28, 30, 31, 35, 44, 46, 47, 48, 49, 50, 51, 52, 53, 54, 58, 61, 63, 65, 80, 81, 84, 85, 98, 99, 100, 101, 102, 103, 105, 106, 107, 108], "dw": 14, "particularli": [14, 18, 93], "verifi": 14, "level": [14, 21, 24, 31, 48, 70, 78, 109], "preprocess": [14, 16], "unplay": 14, "wish": [14, 19, 23], "real": [14, 56, 99], "statist": [14, 119], "playplot": 14, "last": [14, 18, 46, 47, 57, 99, 102, 105, 106, 117, 118], "150": 14, "def": [14, 16, 17, 19, 20, 116, 117, 119], "obs_t": 14, "obs_tp1": 14, "plotter": 14, "render_fp": [14, 18, 117], "30": [14, 18, 24, 68, 71, 101, 102], "amount": [14, 44, 46, 47, 49, 55, 74, 88, 93, 103, 104, 119], "input": [14, 15, 21, 116], "receiv": [14, 15, 21, 34, 37, 41, 44, 45, 51, 57, 60, 89, 90, 95, 108, 114, 116, 118, 119], "map": [14, 19, 21, 42, 113, 114, 116, 117, 119], "unicod": 14, "suppos": 14, "trigger": [14, 114], "key_to_act": 14, "ord": [14, 117], "unknown": [14, 109], "horizon_timestep": 14, "plot_nam": 14, "live": [14, 27, 30, 33, 34, 36, 39, 44, 45, 48, 55, 59, 60, 66, 72, 77, 116], "compute_metr": 14, "obs_tp": 14, "cumulative_reward": 14, "linalg": [14, 117], "norm": [14, 105, 106, 117], "along": [14, 16, 21, 22, 58, 59, 61, 72, 89, 93, 94, 95, 99, 103, 104, 107, 112], "conjunct": 14, "evolv": 14, "200": [14, 49, 72, 90, 92, 93, 94, 96, 113, 114], "immedi": [14, 16, 20, 111, 117], "cumul": [14, 16, 18], "magnitud": [14, 90, 95, 103, 104, 119], "your_env": 14, "len": [14, 17, 116], "horizon": [14, 74, 100, 108, 118], "titl": [14, 94, 95, 116, 119], "dependencynotinstal": [14, 18], "matplotlib": [14, 116, 119], "playablegam": 14, "process_ev": 14, "event": [14, 117], "particular": [14, 16, 19, 21, 22, 90, 118], "keep": [14, 16, 18, 32, 45, 64, 67, 75, 76, 84, 93, 102, 117], "track": [14, 16, 18, 76, 89, 93, 98, 99, 100, 101, 102, 103, 104, 107, 108], "exit": [14, 15], "save_video": 14, "video_fold": [14, 18], "episode_trigg": [14, 18], "step_trigg": [14, 18], "video_length": [14, 18], "name_prefix": [14, 18], "episode_index": 14, "step_starting_index": 14, "extract": 14, "compos": 14, "record": [14, 16, 88, 119], "store": [14, 15, 18, 119], "iff": [14, 18, 117], "isn": 14, "entir": [14, 18, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 100, 108, 109], "snippet": [14, 18], "captur": [14, 18, 83], "Will": [14, 18], "prepend": [14, 18], "filenam": [14, 18], "moviepi": [14, 18], "imagesequenceclip": 14, "durat": [14, 98, 100, 101, 102, 103, 104, 105, 106, 108, 119], "step_index": 14, "199": 14, "capped_cubic_video_schedul": 14, "episode_id": 14, "8": [14, 15, 19, 20, 22, 24, 26, 28, 30, 31, 33, 35, 39, 44, 46, 47, 48, 49, 50, 51, 52, 53, 54, 58, 61, 63, 64, 80, 84, 85, 89, 90, 92, 93, 96, 98, 99, 100, 101, 102, 103, 105, 106, 107, 108, 113, 119], "27": [14, 92, 98, 101, 102], "729": 14, "1000": [14, 18, 21, 72, 74, 89, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 115, 119], "2000": [14, 88, 114], "3000": 14, "schedul": [14, 113], "step_api_compat": [14, 22], "step_return": 14, "output_truncation_bool": [14, 18], "is_vector_env": 14, "doc": [14, 18, 90], "ob": [14, 16, 19, 114, 116, 119], "interfac": [14, 115], "conflict": [14, 109], "final": [14, 15, 18, 57, 116, 117, 118], "desir": [14, 107, 108, 114], "oldenv": 14, "vec_env": 14, "convert_to_terminated_truncated_step_api": [14, 22], "irrespect": 14, "convert_to_done_step_api": 14, "omit": [14, 97, 98, 99, 100, 101, 102, 107, 108], "env_check": 14, "check_env": 14, "skip_render_check": 14, "invas": [14, 78], "farama": [14, 16, 109, 116, 117, 119], "org": [14, 24, 116, 119], "content": 14, "environment_cr": [14, 117], "ignor": [14, 24, 111, 116], "skip": [14, 18, 24, 117], "ci": 14, "linear": [15, 90, 92, 103, 104, 107, 119], "speed": [15, 35, 88, 89], "taken": [15, 18, 48, 54, 91, 93, 117, 119], "wait": [15, 48, 50, 74, 118], "until": [15, 16, 47, 60, 105, 111, 112, 113, 117, 119], "overwritten": [15, 16], "final_observ": [15, 18], "final_info": [15, 18], "asyncvectorenv": 15, "syncvectorenv": 15, "single_observation_spac": 15, "single_action_spac": 15, "v25": [15, 23], "rememb": [15, 18, 89, 117], "share": [15, 119], "other": [15, 16, 17, 18, 19, 22, 30, 39, 42, 50, 56, 90, 96, 97, 99, 103, 105, 106, 108, 113, 114, 116, 117, 119], "word": [15, 105, 119], "02240574": 15, "03439831": 15, "03904812": 15, "02810693": 15, "01586068": 15, "01929009": 15, "02394426": 15, "04016077": 15, "01314174": 15, "03893502": 15, "02400815": 15, "0038326": 15, "00122802": 15, "16228443": 15, "02521779": 15, "23700266": 15, "00788269": 15, "17490888": 15, "03393489": 15, "31735462": 15, "04918966": 15, "19421194": 15, "02938497": 15, "29495203": 15, "releas": [15, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 92, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 112, 113, 114, 117], "resourc": [15, 116, 117], "viewer": 15, "close_extra": 15, "synchron": 15, "asynchron": 15, "garbag": 15, "04456399": 15, "04653909": 15, "01326909": 15, "02099827": 15, "03073904": 15, "00145001": 15, "03088818": 15, "03131252": 15, "03468829": 15, "01500225": 15, "01230312": 15, "01825218": 15, "registri": [15, 21], "env_fn": 15, "context": [15, 119], "daemon": 15, "worker": [15, 68], "pipe": 15, "commun": 15, "lambda": [15, 19, 20, 116], "81": [15, 96], "62": 15, "8286432": 15, "5597771": 15, "90249056": 15, "85009176": 15, "5266346": 15, "60007906": 15, "back": [15, 16, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 52, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 98, 99], "effici": [15, 19, 94, 95, 103], "subprocess": 15, "flag": [15, 94, 109], "turn": [15, 18, 23, 27, 28, 89, 90, 103, 109], "quit": [15, 117], "head": [15, 99], "spawn": [15, 106], "children": 15, "overrid": [15, 16], "inner": 15, "logic": [15, 89, 117], "degre": [15, 19, 101, 102, 103], "chanc": 15, "shoot": [15, 31, 40, 42, 47, 48, 55, 56, 65, 68, 72, 77, 78, 86], "yourself": [15, 48, 68, 89, 116, 117], "foot": [15, 99, 100, 108], "thu": [15, 24, 50, 51, 52, 53, 54, 105, 106, 109], "_worker": 15, "_worker_shared_memori": 15, "runtimeerror": 15, "serial": 15, "modular": [16, 21, 109, 117], "behavior": [16, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 96, 98, 99, 100, 101, 102, 107, 108, 109, 117], "modif": [16, 105, 106], "without": [16, 21, 46, 101, 111, 113, 116, 117], "alter": [16, 21, 24, 117], "lot": [16, 21, 116, 119], "boilerpl": [16, 21, 117], "chain": [16, 21, 92, 107], "base_env": [16, 21], "wrapped_env": [16, 17, 18, 21, 117, 119], "min_act": [16, 17, 21], "max_act": [16, 17, 21], "access": [16, 18, 23, 55], "underneath": [16, 21, 93], "anoth": [16, 39, 101, 102, 104, 105, 106, 108, 114, 116, 118, 119], "get": [16, 21, 24, 44, 47, 48, 49, 56, 66, 67, 68, 69, 71, 72, 73, 78, 88, 90, 98, 100, 101, 103, 111, 116, 118], "layer": [16, 21, 119], "bare": 16, "box2d": [16, 21, 88, 89, 90], "bipedal_walk": [16, 21, 88], "0x7f87d70712d0": [16, 21], "three": [16, 24, 27, 30, 32, 45, 53, 59, 66, 71, 72, 73, 74, 98, 100, 101, 102, 107, 108, 117], "thing": [16, 19, 24], "do": [16, 18, 19, 20, 24, 37, 49, 70, 74, 75, 89, 90, 92, 98, 99, 100, 101, 107, 108, 117, 119], "Such": 16, "actionwrapp": [16, 17], "observationwrapp": [16, 19, 117], "rewardwrapp": [16, 20], "present": [16, 92, 109, 116, 117, 118], "section": [16, 24, 75, 98, 99, 100, 101, 107, 108, 116, 117], "found": [16, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 97, 109, 116, 119], "github": [16, 97, 112, 117], "com": [16, 112, 113, 117, 119], "foundat": [16, 109, 117], "forget": [16, 117], "wrapperacttyp": [16, 17], "wrapperobstyp": [16, 19], "commonli": [16, 21], "page": [16, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 89, 90, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 112, 113, 114], "descript": [16, 117], "misc": 16, "tp": 16, "atari": [16, 21, 22, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 116], "compat": [16, 19, 21, 109, 115], "21": [16, 22, 98, 101, 102, 105, 111, 116], "filter": 16, "request": [16, 111], "anobserv": 16, "stack": [16, 19], "roll": [16, 19, 37, 105], "grai": [16, 18], "scale": [16, 18, 20, 24, 90, 98, 99, 100, 101, 107, 108, 109], "center": [16, 19, 89, 90, 93, 96, 98, 99, 101, 102], "unit": [16, 19, 58, 92, 94, 95, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108], "varianc": [16, 19, 20], "averag": [16, 20, 101, 118, 119], "augment": [16, 19], "obtain": [16, 18, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 96, 111, 118, 119], "replac": [16, 23, 111, 116], "recordvideo": [16, 18, 23], "rollout": [16, 18, 114], "save": [16, 18, 23], "rescal": [16, 21], "axbxc": [16, 19], "resiz": [16, 18], "trajectori": [16, 19, 20, 90, 101, 102], "append": [16, 19, 116, 119], "th": 16, "sometim": [16, 20, 113, 117], "still": [16, 23, 24, 116], "let": [16, 17, 20, 24, 39, 109, 116, 117, 119], "penal": [16, 75], "energi": [16, 88, 90, 93, 109], "weight": [16, 98, 99, 100, 101, 105, 106, 107, 108, 109, 118, 119], "those": [16, 26, 28, 29, 30, 31, 32, 35, 37, 39, 40, 44, 46, 47, 48, 49, 58, 61, 63, 64, 65, 67, 68, 70, 75, 77, 78, 80, 81, 82, 84, 85, 92, 97, 98, 99, 100, 101, 102, 103, 104, 108], "nevertheless": 16, "reacherrewardwrapp": 16, "reward_dist_weight": 16, "reward_ctrl_weight": 16, "reward_dist": [16, 105, 106], "reward_ctrl": [16, 105, 106], "suffici": [16, 30, 32, 34, 36, 41, 116], "simpli": [17, 18, 19, 20, 24, 117], "overwrit": [17, 19, 20], "domain": [17, 89, 92, 94, 95, 114], "sai": [17, 18], "discreteact": 17, "disc_to_cont": 17, "act": [17, 116], "__name__": 17, "__main__": 17, "print": [17, 117, 119], "among": [17, 19, 91, 97], "biped": [17, 87, 101, 102], "walker": [17, 87, 97, 106, 108], "affin": [17, 90], "75": [17, 98], "noop_max": 18, "frame_skip": [18, 98, 99, 100, 101, 107, 108], "screen_siz": 18, "84": [18, 98, 101, 102], "terminal_on_life_loss": 18, "grayscale_ob": 18, "grayscale_newaxi": 18, "scale_ob": 18, "2600": [18, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86], "guidelin": 18, "machado": [18, 24], "et": [18, 24], "al": [18, 22, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 116], "2018": [18, 24, 92], "revisit": [18, 24], "arcad": [18, 24, 31, 48, 50, 51, 52, 53, 54, 109], "evalu": [18, 24, 116], "protocol": [18, 24], "open": [18, 24, 37, 97, 109, 117], "problem": [18, 24, 90, 93, 96, 103, 104, 107, 109, 111, 114, 115, 118], "stage": 18, "op": 18, "pool": [18, 107], "recent": [18, 19, 20, 22], "life": [18, 30, 44, 48, 72, 76, 119], "lost": [18, 33, 41, 60, 73, 77], "loss": [18, 111, 119], "off": [18, 23, 41, 56, 64, 72, 89, 90, 112, 114], "squar": [18, 19, 73, 105, 106, 114, 117], "210x180": 18, "84x84": 18, "grayscal": [18, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86], "colour": [18, 89], "greyscal": 18, "255": [18, 19, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 89, 117], "frequenc": 18, "experi": [18, 98, 101, 102, 103, 104, 116, 119], "whenev": [18, 30, 33, 117], "channel": 18, "axi": [18, 94, 95, 99, 101, 102, 107, 116], "dimension": [18, 21, 28, 90, 98, 99, 100, 106, 107, 108, 117], "memori": [18, 19, 94, 95], "optim": [18, 24, 88, 90, 101, 102, 109, 116, 119], "benefit": 18, "opencv": 18, "new_ob": 18, "final_reward": 18, "final_termin": 18, "final_trunc": 18, "final_don": 18, "prior": 18, "alongsid": 18, "previou": [18, 98, 101, 102, 118], "re": [18, 56, 71, 74, 117, 119], "old_env": 18, "legacyenv": 18, "retun": 18, "modern": [18, 109], "convers": [18, 22, 109], "cartpoleenv": 18, "customenv": 18, "manual": [18, 21, 23, 24, 50, 51, 52, 53, 54], "unregist": 18, "surround": 18, "test": [18, 88, 109, 117, 119], "haven": 18, "screen": [18, 24, 26, 30, 34, 39, 40, 42, 51, 57, 63, 73, 74, 98, 99, 100, 101, 102, 103, 104, 107, 108], "nativ": 18, "nonativerend": 18, "disable_render_order_enforc": 18, "classic_control": [18, 23, 91], "resetneed": 18, "deque_s": [18, 116], "At": [18, 21, 33, 44, 47, 58], "_episod": 18, "l": [18, 107], "elaps": 18, "sinc": [18, 22, 24, 50, 51, 52, 53, 54, 87, 93, 97, 106, 109, 114, 117, 118], "begin": [18, 23, 30, 33, 46, 71, 72, 73, 74, 116, 117], "num": [18, 24, 26, 28, 29, 30, 31, 32, 35, 37, 39, 40, 44, 46, 47, 48, 49, 50, 51, 52, 53, 54, 58, 61, 63, 64, 65, 67, 68, 70, 75, 77, 78, 80, 81, 82, 84, 85, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108], "buffer": [18, 19, 89], "return_queu": [18, 116, 119], "length_queu": [18, 116], "disable_logg": 18, "intermitt": 18, "hundredth": 18, "emploi": 18, "stop": [18, 21, 68, 78, 86, 111, 116, 118], "span": 18, "strictli": 18, "logger": 18, "pop_fram": 18, "reset_clean": 18, "clear": [18, 78], "issu": [18, 21, 23, 24, 98, 100, 101, 102, 108, 117], "place": [18, 28, 93, 94, 95, 117], "\u01f9one": 18, "outermost": 18, "actual": [18, 114, 117], "_k": 18, "classic": [18, 21, 23, 90, 92, 93, 94, 95, 96, 100, 104, 107, 108, 118], "reflect": [19, 93], "2d": [19, 106], "navig": [19, 33, 69, 114, 117], "agent_posit": 19, "target_posit": 19, "throw": [19, 59], "awai": [19, 27, 67, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108], "freedom": [19, 101, 102, 103], "target": [19, 40, 92, 105, 106, 117, 118], "rel": [19, 92, 101, 102, 117], "relativeposit": [19, 117], "f": [19, 20, 116, 119], "ideal": 19, "subclass": 19, "accordingli": [19, 74, 117], "incorrectli": [19, 118], "randn": 19, "08319338": 19, "04635121": 19, "07394746": 19, "20877492": 19, "filter_kei": 19, "00067088": 19, "01860439": 19, "04772898": 19, "01911527": 19, "04560107": 19, "04466959": 19, "0328232": 19, "02367178": 19, "04649447": 19, "14996664": 19, "03329664": 19, "25847703": 19, "96": [19, 24, 89], "27648": 19, "num_stack": 19, "lz4_compress": 19, "lazyfram": 19, "fill": [19, 33, 117], "lz4": 19, "compress": 19, "keep_dim": 19, "uint8": [19, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86], "singleton": 19, "axbx1": 19, "axb": 19, "epsilon": [19, 20, 116], "1e": [19, 20, 101, 107, 108, 119], "past": [19, 20], "newli": [19, 20], "stabil": [19, 20, 101, 102, 119], "pixels_onli": 19, "render_kwarg": 19, "pixel_kei": 19, "choos": [19, 117], "odict_kei": 19, "400": [19, 114], "600": 19, "discard": 19, "assertionerror": 19, "typeerror": 19, "unexpect": 19, "64": [19, 24], "03810719": 19, "03522411": 19, "02231044": 19, "01088205": 19, "03881167": 19, "16021058": 19, "0220928": 19, "28875574": 19, "becaus": [20, 23, 116, 117], "intrins": 20, "gain": [20, 34, 70, 76, 77, 80], "numer": [20, 102, 103, 104, 111, 119], "clipreward": 20, "invari": 20, "incorrect": [20, 114, 118], "gamma": [20, 118, 119], "99": [20, 119], "discount": [20, 116, 118, 119], "factor": [20, 116, 119], "mountain": [21, 91], "car": [21, 33, 49, 87, 91, 109], "four": [21, 33, 44, 89, 90, 98, 100, 108, 114, 116], "introduc": [21, 22, 23, 98, 101, 102], "core": 21, "markov": [21, 118], "decis": [21, 23, 109, 118], "theori": [21, 96, 103], "perfect": 21, "reconstruct": 21, "miss": [21, 75, 92, 114], "compon": [21, 117], "veri": [21, 90, 105, 117], "easi": [21, 60, 110], "loop": [21, 23, 109, 116], "pictur": 21, "simplifi": [21, 96], "someth": 21, "spaceship": [21, 31, 45, 76], "land": [21, 38, 72, 90], "safe": [21, 68, 90], "document": [21, 24, 25, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 91, 98, 101, 102, 103, 110, 116, 117], "imagin": [21, 109], "robot": [21, 23, 36, 86, 88, 94, 95, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 118], "destroi": [21, 27, 29, 31, 32, 33, 34, 35, 36, 39, 40, 41, 42, 45, 46, 54, 60, 71, 72, 73, 76, 77, 78, 80, 90], "enemi": [21, 28, 29, 32, 34, 35, 36, 42, 45, 46, 48, 61, 70, 71, 73, 74, 76, 77, 78, 80, 86], "exchang": 21, "crash": [21, 90], "succeed": 21, "similarli": [21, 90], "restart": 21, "train": [21, 23], "major": 21, "our": [21, 116, 117], "simpl": [21, 88, 110, 115, 118, 119], "util": [21, 22, 117], "coupl": 21, "nich": 21, "li": [21, 109], "lie": 21, "aspect": [21, 118], "regist": [22, 24], "sole": 22, "special": [22, 27, 57, 119], "gymv26environ": 22, "relev": [22, 117], "pong": [22, 24, 39, 43], "v5": [22, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86], "signific": 22, "introduct": [22, 92, 111, 112], "signatur": 22, "previous": [22, 24, 33], "backward": [22, 99, 119], "compliant": [22, 23], "oldv21env": 22, "break": [23, 31, 39, 89], "briefli": 23, "outlin": [23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 111, 116], "stuck": [23, 27, 36, 55], "123": 23, "emul": [23, 24], "awar": 23, "randint": 23, "utilis": 23, "contrast": 23, "older": [23, 97], "definit": [23, 98, 100, 101, 118], "expand": [23, 24, 50, 51, 52, 53, 54], "blog": 23, "post": [23, 32], "soon": [23, 117], "extra": [23, 28, 33, 34, 36, 40, 42, 55, 74, 109, 116, 117], "address": 23, "associ": 23, "librari": [23, 115, 117], "primari": 23, "shouldn": [23, 117], "happen": [23, 73, 94, 95, 98, 100, 101, 102, 103, 104, 105, 106, 108, 111, 113, 114, 118], "fly": [23, 26, 31, 55, 71, 90], "shown": [23, 59, 89, 92, 118], "explan": [23, 116, 119], "summari": 23, "goalenv": 23, "reimplement": 23, "system": [23, 54, 92, 96, 103, 104, 109], "monitor": 23, "stella": 24, "adventur": [24, 43], "air": [24, 43], "raid": [24, 43], "alien": [24, 43, 45, 65, 78], "amidar": [24, 32, 43], "assault": [24, 43], "asterix": [24, 43], "asteroid": [24, 43], "atlanti": [24, 43], "licens": [24, 109, 116, 119], "download": [24, 116, 117, 118, 119], "locat": [24, 60, 109, 112, 113, 114, 117], "agre": 24, "todo": [24, 114], "legal": [24, 50, 51, 52, 53, 54], "fire": [24, 26, 28, 29, 31, 32, 35, 37, 39, 40, 50, 51, 52, 53, 54, 57, 64, 65, 67, 68, 70, 71, 73, 74, 77, 78, 80, 82, 84, 85, 90], "upright": [24, 30, 31, 35, 44, 46, 47, 48, 49, 50, 51, 52, 53, 54, 58, 63, 93, 96, 103, 104], "upleft": [24, 30, 31, 35, 44, 46, 47, 48, 49, 50, 51, 52, 53, 54, 58, 63], "downright": [24, 30, 44, 46, 47, 48, 49, 50, 51, 52, 53, 54, 58, 61, 63], "downleft": [24, 30, 44, 46, 47, 48, 49, 50, 51, 52, 53, 54, 58, 61, 63], "upfir": [24, 28, 31, 37, 50, 51, 52, 53, 54, 68, 80, 81, 82, 84, 85], "11": [24, 31, 50, 51, 52, 53, 54, 58, 61, 98, 99, 100, 101, 102, 103, 105, 106, 108, 111, 112, 116], "rightfir": [24, 26, 28, 29, 31, 32, 35, 40, 50, 51, 52, 53, 54, 58, 61, 64, 65, 67, 77, 80, 81, 84, 85], "leftfir": [24, 26, 28, 29, 31, 32, 40, 50, 51, 52, 53, 54, 58, 61, 64, 65, 67, 77, 80, 81, 84, 85], "13": [24, 31, 50, 51, 52, 53, 54, 58, 61, 98, 99, 101, 102, 105, 108, 114], "downfir": [24, 28, 31, 37, 50, 51, 52, 53, 54, 58, 61, 65, 68, 80, 82, 85], "14": [24, 50, 51, 52, 53, 54, 58, 88, 90, 98, 99, 101, 102, 105, 108, 116], "uprightfir": [24, 31, 50, 51, 52, 53, 54, 58, 61], "upleftfir": [24, 31, 50, 51, 52, 53, 54, 58, 61], "16": [24, 33, 36, 39, 45, 50, 51, 52, 53, 54, 58, 96, 98, 99, 101, 102, 105, 108, 113, 116, 119], "downrightfir": [24, 50, 51, 52, 53, 54, 58, 61], "17": [24, 36, 50, 51, 52, 53, 54, 58, 98, 99, 101, 102, 105, 108, 111], "downleftfir": [24, 50, 51, 52, 53, 54, 58, 61], "smaller": [24, 29, 31, 50, 51, 52, 53, 54], "enumer": [24, 50, 51, 52, 53, 54], "full_action_spac": [24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86], "reduc": [24, 26, 28, 29, 30, 31, 32, 35, 37, 39, 40, 44, 46, 47, 48, 49, 50, 51, 52, 53, 54, 58, 61, 63, 64, 65, 67, 68, 70, 75, 77, 78, 80, 81, 82, 84, 85, 93, 116], "difficulti": [24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 109], "choic": [24, 119], "player": [24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 109, 111, 112, 113, 114, 116], "128": [24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86], "byte": [24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86], "ram": [24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86], "exact": [24, 37, 50, 51, 52, 53, 54, 111, 116], "atariag": [24, 25, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 79, 81, 82, 83, 84, 85, 86], "determinist": [24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 92, 94, 95, 117], "art": 24, "memor": 24, "sticki": [24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86], "small": [24, 54, 73, 88, 109, 110, 119], "On": [24, 65, 92, 93, 94, 95, 96], "top": [24, 39, 44, 51, 57, 59, 73, 89, 90, 91, 94, 95, 100, 103, 104, 108, 117, 119], "repeat": [24, 105], "frameskip": [24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86], "exclus": 24, "tabl": [24, 27, 28, 30, 44, 46, 101, 102, 105], "obs_typ": 24, "Its": 24, "repeat_action_prob": [24, 50, 51, 52, 53, 54], "stick": [24, 33, 55, 111, 116], "ll": [24, 57, 74, 116], "sound": 24, "lock": 24, "proper": 24, "audio": 24, "framer": [24, 102, 105, 106, 117], "best": [24, 50, 51, 52, 53, 54, 116], "practic": [24, 50, 51, 52, 53, 54, 109, 116, 118], "configur": [24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 91, 97, 110, 116, 117], "variat": 24, "amidardeterminist": 24, "amidarnoframeskip": 24, "ramdeterminist": 24, "ramnoframeskip": 24, "suffix": [24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86], "noframeskip": [24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86], "airraid": [24, 26], "31": [24, 31, 101, 102], "bankheist": [24, 33], "20": [24, 33, 39, 66, 74, 90, 98, 101, 102, 105, 114, 116], "24": [24, 33, 39, 64, 88, 89, 90, 93, 98, 101, 102, 116], "battlezon": [24, 34], "beamrid": [24, 35], "berzerk": [24, 43], "18": [24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 98, 99, 101, 102, 105, 108], "bowl": [24, 43], "breakout": [24, 43], "32": [24, 39, 56, 101, 102, 111, 119], "36": [24, 39, 101, 102, 112], "40": [24, 39, 64, 101, 102], "44": [24, 39, 101, 102], "carniv": [24, 43], "centiped": [24, 43], "22": [24, 41, 98, 101, 102, 105, 116], "86": [24, 41], "choppercommand": [24, 42], "crazyclimb": [24, 44], "defend": [24, 32, 43, 48, 64, 76], "demonattack": [24, 46], "doubledunk": [24, 47], "elevatoract": [24, 48], "enduro": [24, 43], "fishingderbi": 24, "freewai": [24, 43], "frostbit": [24, 43], "gopher": [24, 43], "gravitar": [24, 43], "hero": [24, 43], "icehockei": 24, "jamesbond": [24, 43], "journeyescap": 24, "kangaroo": [24, 43], "krull": [24, 43], "kungfumast": [24, 61], "montezumareveng": [24, 62], "mspacman": [24, 63], "namethisgam": [24, 64], "phoenix": [24, 43], "pitfal": [24, 43, 88], "pooyan": [24, 43], "50": [24, 58, 68, 74, 90, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 119], "70": [24, 68], "privateey": 24, "qbert": [24, 43], "riverraid": [24, 43], "roadrunn": [24, 72], "robotank": [24, 43, 73], "seaquest": [24, 43], "ski": [24, 43], "solari": [24, 43], "spaceinvad": 24, "stargunn": 24, "tenni": [24, 43], "timepilot": 24, "tutankham": [24, 43], "upndown": [24, 82], "ventur": [24, 43], "videopinbal": [24, 84, 85], "wizardofwor": [24, 85], "yarsreveng": 24, "zaxxon": [24, 43], "oppos": 24, "ai": [24, 109], "mg": 24, "bellemar": 24, "naddaf": 24, "j": [24, 119], "veness": 24, "platform": 24, "journal": [24, 114], "artifici": [24, 114], "intellig": [24, 114], "research": [24, 97, 103, 114], "2012": 24, "url": 24, "jair": [24, 114], "php": 24, "articl": [24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86], "view": [24, 54], "11182": 24, "250": [25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86], "160": [25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86], "enchant": [25, 41], "chalic": 25, "golden": 25, "castl": 25, "pick": [25, 48, 59, 72, 114, 116], "sword": 25, "bridg": [25, 71, 109], "magnet": 25, "fight": [25, 38, 61, 64, 109], "outmanoeuvr": 25, "dragon": 25, "flavor": [25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86], "switch": [25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 109], "thorough": [25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86], "discuss": [25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86], "intric": [25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86], "stochast": [25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 91, 92, 94, 95, 97, 98, 99, 100, 101, 102, 103, 104, 106, 107, 108, 112, 114], "ship": [26, 27, 29, 35, 45, 54, 76], "sidewai": [26, 29, 35, 71, 75], "protect": [26, 32, 41, 42, 53, 58, 68], "saucer": [26, 31, 78], "try": [26, 27, 28, 37, 39, 44, 67, 68, 116], "drop": [26, 33, 114], "bomb": [26, 45, 57, 65, 78], "meaning": [26, 28, 29, 30, 31, 32, 35, 37, 39, 40, 44, 46, 47, 48, 49, 58, 61, 63, 64, 65, 67, 68, 70, 75, 77, 78, 80, 81, 82, 84, 85], "210": [27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 45, 46, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86], "maze": [27, 28, 33, 36, 62, 81], "egg": 27, "scatter": [27, 69], "simultan": [27, 28], "kill": [27, 36, 55, 60], "flamethrow": 27, "tricki": 27, "situat": [27, 114], "occasion": [27, 31], "power": [27, 55, 89, 90, 95, 103, 104, 119], "pulsar": 27, "temporari": 27, "abil": 27, "score": [27, 28, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 55, 56, 57, 58, 59, 60, 66, 67, 68, 69, 70, 71, 72, 74, 78, 79, 80, 84, 88, 90], "prize": [27, 82], "caught": [27, 33], "lose": [27, 30, 32, 41, 44, 45, 48, 55, 57, 66, 67, 69, 71, 72, 74, 75, 76, 90, 111, 116], "consult": [27, 56, 57, 58, 59, 60], "pac": 28, "man": 28, "visit": [28, 48, 89], "grid": [28, 112, 113, 114, 116, 117], "chicken": [28, 40, 51], "catch": [28, 44, 50, 72], "travers": 28, "vehicl": [29, 34, 49, 58], "big": [29, 50, 117], "mother": [29, 59, 68], "circl": [29, 117], "overhead": [29, 90], "deploi": 29, "drone": 29, "dodg": [29, 35, 74], "attack": [29, 31, 32, 35, 43, 45, 68], "horizont": [30, 40, 88, 90, 92, 117], "vertic": [30, 88, 103, 104, 117], "lyre": 30, "guid": [30, 51, 109], "award": [30, 36, 41, 44, 48, 74, 103, 104], "field": 31, "appear": [31, 33, 36, 73, 94, 95], "satellit": 31, "ufo": 31, "job": [32, 117], "submerg": 32, "citi": [32, 33, 69], "slowli": 32, "descend": 32, "toward": [32, 56, 107], "strike": [32, 37], "distanc": [32, 49, 99, 117], "defens": [32, 47], "manag": [32, 37], "seven": 32, "fought": 32, "wave": [32, 42, 46, 58, 65, 78], "outer": [32, 92], "robber": 33, "natur": [33, 111, 113, 116], "rob": 33, "getawai": 33, "polic": 33, "chase": [33, 36], "dynamit": [33, 55], "ga": [33, 89], "tank": [33, 34, 74], "nine": [33, 98], "leav": [33, 93, 97, 103, 117], "person": [34, 92, 109], "perspect": [34, 109], "3d": [34, 98, 101, 102, 109, 116], "illus": 34, "radar": [34, 85], "travel": 35, "steer": [35, 82, 89], "debri": 35, "leftifir": 35, "evil": [36, 61, 86], "touch": [36, 69, 117], "wall": [36, 39, 55, 94, 95, 114], "undefeat": 36, "otto": 36, "tri": 37, "knock": [37, 38], "pin": 37, "spar": 37, "spare": 37, "300": [37, 49, 88, 117], "oppon": [38, 50, 56, 67, 82], "ring": 38, "hit": [38, 39, 40, 41, 46, 68, 69, 72, 73, 75, 111, 116], "punch": [38, 59], "famou": 39, "paddl": [39, 67], "ball": [39, 56, 67, 84], "brick": 39, "wreak": 39, "havoc": 39, "five": [39, 69, 75, 91, 119], "214": 40, "em": 40, "gun": [40, 48], "suppli": [40, 64, 118], "ammunit": 40, "steal": [40, 50], "bullet": [40, 109], "subtract": 40, "minu": 40, "sign": [40, 103, 104, 119], "elf": [41, 113], "magic": 41, "wand": 41, "fend": 41, "spider": 41, "flea": 41, "mushroom": 41, "forest": 41, "bitten": 41, "tempor": 41, "paralyz": 41, "scorpion": 41, "round": 41, "helicopt": [42, 44, 71], "truck": [42, 72], "convoi": 42, "aircraft": [42, 80], "mini": 42, "bottom": [42, 57, 89, 94, 95, 100, 108, 112], "plane": 42, "surviv": [42, 46], "bank": [43, 71], "heist": 43, "battl": 43, "zone": 43, "beam": [43, 55], "rider": 43, "chopper": 43, "command": [43, 97], "crazi": 43, "climber": 43, "demon": 43, "doubl": [43, 97], "dunk": 43, "elev": 43, "fish": 43, "derbi": 43, "ic": [43, 46, 52, 56, 113], "hockei": [43, 56], "journei": [43, 58, 116], "kung": 43, "fu": 43, "master": [43, 112, 119], "montezuma": 43, "reveng": 43, "pacman": 43, "privat": [43, 69, 117], "ey": [43, 64, 69], "road": [43, 89], "runner": 43, "invad": [43, 77], "star": 43, "gunner": 43, "pilot": [43, 65, 86], "pinbal": 43, "wizard": [43, 61], "Of": 43, "wor": 43, "yar": 43, "builid": 44, "obstacl": [44, 58, 59], "fall": [44, 46, 66, 72, 88, 101, 112, 113, 118], "damag": [44, 73], "climb": [44, 59, 91], "fast": [44, 89, 97, 99, 101, 103, 107, 109], "least": [44, 79, 90], "row": [44, 77, 112, 113], "earth": [45, 77], "rescu": [45, 55, 59, 60, 61, 74, 76], "smart": 45, "shot": [45, 47, 48, 56, 57, 72, 109], "abduct": 45, "unlimit": 45, "laser": [45, 55, 77, 85], "missil": [45, 71], "aliv": [45, 101, 108], "face": [46, 98, 101, 102, 111, 116], "planet": [46, 54, 76], "krybor": 46, "accumul": 46, "reserv": [46, 71, 73, 74], "bunker": [46, 54], "increas": [46, 74, 90, 92, 93, 100, 107, 108, 116], "grant": [46, 90], "slai": 46, "2v2": 47, "basketbal": 47, "possess": 47, "rival": 47, "team": 47, "rule": [47, 79, 109, 111, 116], "foul": 47, "success": [47, 92, 114, 118], "secret": [48, 69], "ground": [48, 68, 88, 90, 98, 102, 109], "stair": 48, "equip": 48, "against": [48, 67, 79, 109], "floor": 48, "gather": [48, 69, 117], "apart": [48, 117], "mark": 48, "red": [48, 54, 114, 117], "door": 48, "unreleas": 48, "prototyp": 48, "500": [48, 71, 92, 93, 114, 116], "racer": 49, "nation": 49, "long": [49, 84, 93, 103, 104], "endur": 49, "race": [49, 72, 75, 87], "overtak": 49, "dai": [49, 87], "stai": 49, "meet": 49, "quota": 49, "sunfish": 50, "But": [50, 75], "fisherman": 50, "black": [50, 60, 92, 116], "shark": [50, 64, 74], "lurk": [50, 70], "surfac": [50, 74, 103, 104, 117], "lane": [51, 109], "busi": 51, "rush": 51, "hour": 51, "traffic": [51, 109], "cross": [51, 112, 113], "bailei": 52, "who": [52, 53, 58, 59, 75], "hop": [52, 70, 100, 108], "forth": 52, "arctic": 52, "river": [52, 71], "block": 52, "white": 52, "blue": [52, 54, 79, 92, 114, 117], "he": [52, 54], "hi": [52, 54, 69], "igloo": 52, "shovel": 53, "wield": 53, "farmer": 53, "crop": 53, "carrot": 53, "spacecraft": 54, "fiction": 54, "solar": 54, "landscap": 54, "miner": 55, "mine": [55, 72], "shaft": 55, "tool": [55, 62], "propel": 55, "backpack": 55, "wherev": 55, "blast": [55, 74, 76], "vermin": 55, "raft": 55, "stretch": 55, "critter": 55, "remain": [55, 58, 59, 74, 98, 112, 117, 118], "standard": [56, 98, 99, 103, 109, 119], "minut": [56, 66], "period": [56, 100, 108], "puck": 56, "angl": [56, 57, 88, 90, 92, 93, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108], "extrem": [56, 109, 110], "rink": 56, "realli": [56, 116], "mr": 57, "bond": 57, "design": [57, 92, 98, 101, 102, 109, 110, 114, 117], "multipurpos": 57, "craft": [57, 90], "varieti": [57, 109], "motion": [57, 109], "slightli": [57, 88, 98], "jump": [57, 72, 75], "dive": 57, "lob": 57, "rate": [57, 74, 116, 119], "highest": 57, "novic": 57, "006": 57, "007": 57, "lead": 58, "peski": 58, "backstag": 58, "scarab": 58, "000": [58, 71, 74], "concert": 58, "cash": 58, "grasp": 58, "groupi": 58, "photograph": 58, "promot": 58, "encount": [58, 59, 80], "her": [59, 68], "preciou": 59, "babi": 59, "ladder": [59, 88], "bonu": [59, 73, 74, 78, 108], "fruit": 59, "monkei": 59, "corner": 59, "beast": 60, "fortress": [60, 62], "princess": [60, 61], "lyssa": 60, "sunris": 60, "monster": [60, 83], "templ": 61, "victoria": 61, "defeat": [61, 70], "acquir": [62, 97], "treasur": [62, 64, 66, 81, 83], "chamber": [62, 83], "emperor": 62, "deadli": 62, "creatur": [62, 70, 78, 109], "valuabl": 62, "pellet": 63, "ghost": 63, "discov": 64, "octopu": 64, "oxygen": [64, 74], "elimin": [65, 81, 82, 83], "war": 65, "bird": 65, "harri": 66, "jungl": 66, "die": [66, 68, 89], "misfortun": 66, "hole": [66, 113], "compet": 67, "deflect": 67, "pig": 68, "piglet": 68, "wolv": 68, "rope": 68, "balloon": 68, "guard": 68, "eat": [68, 72], "bait": 68, "wolf": 68, "stone": 68, "rock": [68, 72], "french": 69, "pierr": 69, "street": 69, "park": 69, "passag": 69, "dead": 69, "search": 69, "ringlead": 69, "henri": 69, "le": 69, "fiend": 69, "gang": 69, "evid": 69, "stolen": 69, "good": [69, 116], "statut": 69, "expir": 69, "nab": 69, "question": [69, 109], "auto": 69, "pothol": 69, "q": [70, 114, 118], "bert": 70, "cube": 70, "pyramid": 70, "destin": [70, 114], "nasti": 70, "jet": 71, "fli": 71, "fuel": [71, 76, 90], "depot": 71, "collid": [71, 74, 90], "squadron": [71, 73], "tanker": 71, "80": [71, 113], "tm": 72, "direct": [72, 74, 92, 93, 94, 95, 98, 100, 101, 103, 104, 108, 112, 113, 114, 117, 119], "outrun": 72, "wile": 72, "coyot": 72, "hazard": 72, "desert": 72, "rocket": [72, 73, 90], "cannon": [72, 77], "cliff": [72, 110], "steel": 72, "pile": 72, "birdse": 72, "cannonbal": 72, "activ": [73, 117], "scrambl": 73, "static": 73, "interfer": 73, "sensor": [73, 89], "report": [73, 88, 98, 101, 102], "flash": 73, "panel": 73, "c": [73, 90, 92, 119], "earn": 73, "twelv": 73, "abl": [74, 118], "torpedo": 74, "diver": 74, "killer": 74, "deliv": [74, 114], "six": [74, 108], "explod": 74, "anyth": 74, "decreas": [74, 90], "almost": 74, "yoursub": 74, "blow": 74, "forc": [74, 76, 90, 93, 94, 95, 98, 101, 102, 103, 104, 119], "less": [74, 88, 90, 103, 107], "worth": [74, 77], "90": [74, 116], "skier": 75, "gate": 75, "fastest": 75, "slalom": 75, "penalti": [75, 114], "warp": 76, "sector": 76, "feder": 76, "zylon": 76, "refuel": 76, "cadet": 76, "corridor": 76, "mania": [78, 80], "orang": 79, "win": [79, 111, 116], "margin": 79, "ti": 79, "sport": 79, "till": [79, 116], "technologi": 80, "increasingli": 80, "difficult": [80, 93, 97, 103, 104], "rack": 81, "tomb": 81, "guardian": 81, "baja": 82, "bugger": 82, "dungeon": 83, "beat": [85, 111], "scanner": 85, "armi": 86, "enslav": 86, "galaxi": 86, "fighter": 86, "lunar": 87, "lander": 87, "toi": [87, 111, 112, 113, 114], "contribut": 87, "earli": [87, 116, 119], "oleg": [87, 88, 89, 90], "klimov": [87, 88, 89, 90], "popular": [87, 109, 116], "benchmark": 87, "ever": 87, "joint": [88, 90, 92, 93, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108], "uneven": 88, "terrain": [88, 109], "hardcor": 88, "stump": 88, "1600": 88, "heurist": [88, 90], "demonstr": [88, 109], "motor": [88, 107], "hip": [88, 98, 101, 102], "knee": [88, 101, 102], "hull": 88, "angular": [88, 90, 92, 93, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108], "leg": [88, 90, 98, 100, 101, 102, 108], "contact": [88, 90, 97, 98, 101, 102, 103], "lidar": 88, "rangefind": 88, "measur": [88, 96, 98, 99, 100, 101, 102, 103, 105, 106, 107, 108], "far": [88, 89, 103, 105, 106, 113], "torqu": [88, 92, 96, 98, 99, 100, 101, 102, 105, 106, 107, 108], "cost": [88, 99, 100, 107, 108, 109], "better": 88, "stand": [88, 97, 98, 101, 102, 103, 104, 116], "slight": 88, "exce": [88, 111], "closest": 88, "trace": 88, "furthest": 88, "faster": [88, 90, 102], "spent": [88, 90], "friction": [88, 107, 109], "nervous": 88, "easiest": 89, "ab": 89, "wheel": 89, "gyroscop": 89, "car_rac": 89, "rear": 89, "drive": 89, "brake": 89, "96x96": 89, "tile": 89, "732": 89, "926": 89, "rest": [89, 90, 100, 108], "playfield": 89, "lap_complete_perc": 89, "dictat": [89, 90], "percentag": [89, 116], "lap": 89, "domain_random": 89, "variant": [89, 117], "scenario": [89, 109], "background": 89, "demand": 89, "correspondingli": 89, "init": [89, 117], "scheme": [89, 109], "chri": 89, "campbel": 89, "2014": 89, "www": [89, 111, 112, 113], "iforce2d": 89, "net": [89, 111, 112, 119], "b2dtut": 89, "pontryagin": 90, "principl": 90, "engin": [90, 97], "throttl": 90, "why": 90, "pad": 90, "infinit": [90, 100, 108, 111, 116, 118], "lunar_land": 90, "orient": [90, 98, 101, 102], "sum": [90, 98, 99, 100, 101, 102, 105, 106, 107, 108, 111, 116], "closer": [90, 111], "slower": 90, "tilt": 90, "03": 90, "solut": [90, 116], "viewport": 90, "mass": [90, 98, 99, 101, 102, 107], "bodi": [90, 97, 98, 99, 100, 101, 102, 103, 104, 107, 108], "moon": 90, "greater": [90, 92, 93, 94, 95, 99, 104, 105, 107, 111, 116], "awak": 90, "group": 90, "come": [90, 98, 99, 100, 101, 102, 103, 104, 107, 108], "sleep": 90, "littl": [90, 102], "cpu": 90, "wake": 90, "attach": [90, 93, 96, 98, 108], "graviti": [90, 93, 94, 96, 103, 104, 119], "enable_wind": 90, "wind_pow": 90, "turbulence_pow": 90, "later": [90, 116, 119], "booster": 90, "gravit": 90, "wind": 90, "tanh": [90, 119], "sin": [90, 96, 103], "pi": [90, 92, 96], "9999": 90, "rotat": [90, 92, 98, 101, 102, 105, 116], "turbul": 90, "renorm": 90, "harder": 90, "push": [90, 93, 103, 104, 109, 119], "cart": [91, 103, 104, 119], "nois": [91, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108], "regard": 91, "underpow": 91, "effort": 91, "easier": 91, "ones": [91, 97, 116], "57": 92, "spars": [92, 117], "coars": 92, "barto": [92, 93, 103, 104, 111, 112, 116], "book": [92, 111, 112, 116], "link": [92, 98, 99, 100, 101, 102, 106, 107], "linearli": [92, 103, 104, 119], "actuat": [92, 93, 101, 102], "swing": [92, 96], "free": [92, 96, 97, 98, 101, 102, 103, 104, 109, 116, 119], "height": [92, 100, 103, 108], "hang": 92, "downward": 92, "seen": [92, 99], "green": [92, 114], "cosin": [92, 103, 106], "theta1": 92, "sine": [92, 103, 106], "theta2": 92, "567": 92, "274": 92, "4\u03c0": 92, "9\u03c0": 92, "rad": [92, 93, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108], "incur": [92, 112, 114], "co": [92, 94, 95, 96, 103, 106, 109], "book_or_nip": 92, "neurip": 92, "paper": [92, 103, 114], "nip": 92, "equat": [92, 96], "confirm": 92, "radian": [92, 93, 96, 104], "1996": 92, "touretzki": 92, "mozer": 92, "hasselmo": 92, "ed": 92, "vol": [92, 114], "mit": [92, 116, 119], "proceed": 92, "cc": 92, "1995": 92, "8f1d43620bc6bb580df6e80b0dc05c48": 92, "pdf": [92, 111, 112], "anderson": [93, 103, 104], "neuronlik": [93, 103, 104], "adapt": [93, 103, 104, 112], "un": 93, "frictionless": 93, "balanc": [93, 103, 104, 119], "vari": [93, 103, 104, 119], "418": 93, "untermin": 93, "2095": 93, "allot": 93, "475": 93, "05": [93, 98, 99, 105], "07": [94, 95], "sinusoid": [94, 95], "vallei": [94, 95], "strateg": [94, 95], "hill": [94, 95], "andrew": [94, 95], "moor": [94, 95], "phd": [94, 95, 107], "thesi": [94, 95, 107], "1990": [94, 95], "techreport": [94, 95], "moore90efficientmemori": [94, 95], "author": [94, 95, 109, 116, 119], "william": [94, 95, 119], "institut": [94, 95], "univers": [94, 95], "cambridg": [94, 95], "year": [94, 95], "001": [94, 96, 100, 103, 108, 116], "0025": [94, 95], "collis": [94, 95], "inelast": [94, 95], "upon": [94, 95], "quickli": [94, 116], "penalis": [94, 95, 98, 99, 100, 101, 102, 103, 105, 106, 107, 108], "equal": [94, 95, 103, 111, 113], "0015": 95, "45": [95, 102, 105], "999": 95, "invert": [96, 97, 119], "swingup": 96, "diagram": 96, "meter": 96, "theta": 96, "tau": 96, "counter": 96, "clockwis": 96, "theta_dt": 96, "heta": 96, "2736044": 96, "calcul": [96, 97, 98, 101, 102, 103, 105, 106, 112, 113, 114], "math": 96, "half": 97, "cheetah": 97, "standup": 97, "facilit": [97, 109], "develop": [97, 119], "biomechan": 97, "graphic": [97, 109], "anim": 97, "area": 97, "accur": 97, "octob": 97, "2021": [97, 109], "deepmind": 97, "2022": 97, "everyon": 97, "instruct": [97, 117], "websit": [97, 109], "framework": 97, "ten": [97, 111, 116], "iverteddoublependulum": 97, "gaussian": 97, "mjsim": 97, "qpo": 97, "qvel": [97, 101, 102], "indirectli": 97, "xml": [97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108], "tweak": [97, 107], "schulman": 98, "moritz": 98, "levin": 98, "jordan": 98, "abbeel": 98, "advantag": [98, 109, 117], "estim": [98, 118, 119], "torso": [98, 99, 100, 101, 102, 108], "eight": 98, "hing": [98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108], "rotor": [98, 99, 100, 101, 102, 107, 108], "front": [98, 99, 107], "hip_1": [98, 101, 102], "front_left_leg": [98, 101, 102], "angle_1": [98, 101, 102], "hip_2": [98, 101, 102], "front_right_leg": [98, 101, 102], "angle_2": 98, "hip_3": 98, "back_leg": 98, "angle_3": 98, "hip_4": 98, "right_back_leg": 98, "angle_4": 98, "deriv": [98, 99, 100, 101, 102, 103, 104, 107, 108, 119], "exclude_current_positions_from_observ": [98, 99, 100, 101, 107, 108], "113": 98, "regardless": [98, 99, 100, 101, 107, 108], "x_posit": [98, 99, 100, 101, 107, 108], "y_posit": [98, 101, 107], "111": 98, "z": [98, 99, 100, 101, 102, 105, 106, 108], "centr": [98, 101, 102], "ankle_1": 98, "ankle_2": 98, "ankle_3": 98, "ankle_4": 98, "19": [98, 101, 102, 105], "23": [98, 101, 102, 105, 109], "translat": [98, 101, 102, 117], "dof": [98, 101, 102], "quaternion": [98, 101, 102], "healthy_reward": [98, 100, 101, 108], "healthi": [98, 100, 101, 108], "forward_reward": [98, 99, 100, 101, 107, 108], "dt": [98, 99, 100, 101, 105, 106, 107, 108], "frametim": [98, 99, 100, 101, 107, 108], "ctrl_cost": [98, 99, 100, 101, 107, 108], "too": [98, 99, 100, 101, 102, 103, 105, 106, 107, 108], "ctrl_cost_weight": [98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108], "ctr_cost_weight": 98, "contact_cost": [98, 101], "contact_cost_weight": [98, 101], "contact_force_rang": 98, "reset_noise_scal": [98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108], "deviat": [98, 99, 103, 107, 119], "intention": [98, 101, 102], "therebi": [98, 101, 102], "unhealthi": [98, 100, 101, 108], "healthy_z_rang": [98, 100, 101, 108], "terminate_when_unhealthi": [98, 100, 101, 108], "xml_file": [98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108], "path": [98, 99, 100, 101, 105, 106, 107, 108, 113], "model": [98, 99, 100, 101, 107, 108, 109, 116], "5e": [98, 100, 101, 108], "perturb": [98, 99, 100, 101, 107, 108], "induct": [98, 99, 100, 101, 107, 108], "bia": [98, 99, 100, 101, 107, 108], "induc": [98, 99, 100, 101, 107, 108], "agnost": [98, 99, 100, 101, 102, 107, 108], "bind": [98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108], "camera": [98, 99, 100, 101, 102, 103, 104, 107, 108], "mujoco_pi": [98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108], "max_time_step": [98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108], "p": [99, 109, 112, 113, 114], "wawrzy\u0144ski": 99, "cat": 99, "paw": 99, "alloc": 99, "thigh": [99, 100, 101, 102, 108], "shin": [99, 101, 102], "feet": [99, 108], "bthigh": 99, "bshin": 99, "bfoot": 99, "fthigh": 99, "fshin": 99, "ffoot": 99, "tip": [99, 103, 107], "rootz": [99, 100, 108], "slide": [99, 100, 103, 104, 105, 106, 107, 108], "rooti": [99, 100, 108], "rootx": [99, 100, 108], "forward_reward_weight": [99, 100, 101, 107, 108], "half_cheetah": 99, "erez": [100, 101, 102, 108], "tassa": [100, 101, 102, 108], "todorov": [100, 101, 102, 108], "predict": [100, 108, 119], "nonlinear": [100, 108], "compar": [100, 107, 108, 116], "figur": [100, 108, 116, 119], "middl": [100, 108], "thigh_joint": [100, 108], "leg_joint": [100, 108], "foot_joint": [100, 108], "002": [100, 108], "008": [100, 108], "els": [100, 108, 113, 116, 117], "healthy_state_rang": 100, "fallen": 100, "healthy_angle_rang": [100, 108], "376": [101, 102], "synthesi": [101, 102], "onlin": [101, 102, 109, 111, 112], "abdomen": [101, 102], "pair": [101, 102], "arm": [101, 102, 105, 106, 109], "elbow": [101, 102, 105], "walk": [101, 108, 110, 113, 117], "right_hip_x": [101, 102], "right_thigh": [101, 102], "right_hip_z": [101, 102], "right_hip_i": [101, 102], "right_kne": [101, 102], "left_hip_x": [101, 102], "left_thigh": [101, 102], "left_hip_z": [101, 102], "left_hip_i": [101, 102], "left_kne": [101, 102], "right_shoulder1": [101, 102], "right_shoulder2": [101, 102], "right_elbow": [101, 102], "left_shoulder1": [101, 102], "left_shoulder2": [101, 102], "left_elbow": [101, 102], "378": 101, "root": [101, 102], "lower_waist": [101, 102], "abdomen_z": [101, 102], "abdomen_i": [101, 102], "pelvi": [101, 102], "abdomen_x": [101, 102], "right_upper_arm": [101, 102], "right_lower_arm": [101, 102], "left_upper_arm": [101, 102], "left_lower_arm": [101, 102], "anglular": [101, 102, 104], "29": [101, 102], "aanglular": [101, 102], "33": [101, 102], "34": 101, "35": [101, 102], "37": [101, 102], "39": [101, 102], "41": [101, 102], "43": [101, 102], "velocitti": 101, "addition": [101, 102], "cinert": [101, 102], "inertia": [101, 102], "rigid": [101, 102], "intermedi": [101, 102], "nbodi": [101, 102], "henc": [101, 102, 110, 119], "140": [101, 102], "cvel": [101, 102], "qfrc_actuat": [101, 102], "constraint": [101, 102, 103, 109], "nv": [101, 102], "cfrc_ext": [101, 102], "dim": [101, 102], "003": 101, "015": 101, "nu": [101, 102], "contact_cost_rang": 101, "lai": 102, "state_spac": 102, "uph_cost": 102, "upward": 102, "absolut": [102, 104, 108], "overal": 102, "atom": 102, "movement": [102, 117], "though": 102, "inflat": 102, "quad_ctrl_cost": 102, "quad_impact_cost": 102, "000001": 102, "105": 102, "unlik": [102, 103, 104, 105, 106, 119], "beyond": [102, 103, 104, 105, 106, 108], "slider": [103, 104], "unitless": [103, 106], "hinge2": 103, "realist": [103, 109], "accuraci": 103, "approach": [103, 116, 117, 119], "analyt": 103, "alive_bonu": 103, "distance_penalti": 103, "velocity_penalti": 103, "005": [103, 105, 106], "y_coordin": 103, "196": 103, "perpendicularli": 103, "cylind": 105, "effector": [105, 106], "fingertip": [105, 106], "shoulder": 105, "forearm": 105, "wrist": 105, "pan": 105, "r_shoulder_pan_joint": 105, "lift": 105, "r_shoulder_lift_joint": 105, "r_upper_arm_roll_joint": 105, "flex": 105, "r_elbow_flex_joint": 105, "r_forearm_roll_joint": 105, "r_wrist_flex_joint": 105, "r_wrist_roll_joint": 105, "analogi": 105, "tips_arm": 105, "obj_slidex": 105, "obj_slidei": 105, "goal_slidex": 105, "goal_slidei": 105, "sphere": 105, "reward_near": 105, "unattach": [105, 106], "reward_control": [105, 106], "euclidean": [105, 106], "perman": 105, "323": 105, "rise": 105, "asset": [105, 106, 109, 113], "gymnasmium": 105, "fixtur": 106, "joint0": 106, "joint1": 106, "target_x": 106, "target_i": 106, "position_fingertip": 106, "position_target": 106, "na": 106, "disk": 106, "radiu": 106, "everyth": 106, "02": 106, "r\u00e9mi": 107, "coulom": 107, "applic": [107, 109], "segment": 107, "articul": [107, 109], "suspend": 107, "subject": 107, "fluid": 107, "viscou": 107, "coeffici": 107, "motor1_rot": 107, "motor2_rot": 107, "\u03b8": 107, "free_body_rot": 107, "slider1": 107, "slider2": 107, "04": 107, "swim": 107, "split": 108, "thigh_left_joint": 108, "leg_left_joint": 108, "foot_left_joint": 108, "ctr_cost": 108, "procedur": [109, 119], "clone": [109, 117], "huge": 109, "3v3": 109, "hundr": 109, "roughli": 109, "tweakabl": 109, "monei": 109, "slime": 109, "volleybal": 109, "motiv": 109, "premad": 109, "foss": 109, "interoper": 109, "extens": [109, 119], "light": 109, "poli": 109, "pinocchio": 109, "meshcat": 109, "web": 109, "bitcraz": 109, "crazyfli": 109, "nanoquadrotor": 109, "endeavor": 109, "gap": 109, "deep": [109, 118, 119], "methodologi": 109, "coverag": 109, "laboratori": 109, "internet": 109, "quadrotor": 109, "casadi": 109, "symbol": 109, "priori": 109, "isaac": 109, "omnivers": 109, "cours": 109, "wide": 109, "account": 109, "yield": 109, "voltag": 109, "duti": 109, "cycl": 109, "plan": 109, "emphasi": 109, "percept": 109, "social": 109, "driver": 109, "whose": [109, 111], "uncertain": 109, "merg": 109, "intersect": 109, "roundabout": 109, "latent": 109, "transfer": 109, "miniatur": 109, "racecar": 109, "llvm": 109, "phase": 109, "gcc": 109, "cuda": 109, "p_0": 109, "morl": 109, "cell": [109, 112, 117], "warehous": 109, "storag": 109, "overfit": 109, "predefin": [109, 117], "hyperparamet": [109, 116, 119], "cheap": 109, "surrog": 109, "evolutionari": 109, "tag": 109, "answer": 109, "classif": 109, "dataset": 109, "autom": 109, "prover": 109, "vampir": 109, "theoret": 109, "workshop": 109, "minatari": 109, "bsuit": 109, "great": [109, 116], "focu": 109, "simplic": 109, "comprehens": 109, "crypto": 109, "omg": 109, "toolbox": 109, "minimalist": 109, "synthes": 109, "neuro": 109, "architectur": 109, "integr": 109, "twin": 109, "concept": 109, "seamless": 109, "firmwar": 109, "neuroflight": 109, "frozen": 110, "lake": 110, "suitabl": 110, "card": [111, 116], "dealer": [111, 116], "deck": [111, 116], "jack": 111, "queen": 111, "king": 111, "ac": [111, 116], "usabl": [111, 116], "held": 111, "decid": 111, "bust": [111, 116], "reveal": 111, "facedown": 111, "goe": 111, "outcom": 111, "hand": [111, 119], "sab": [111, 116], "2020": [111, 112], "incompleteidea": [111, 112], "rlbook2020": [111, 112], "48": 112, "4x12": 112, "world": [112, 113, 114], "132": 112, "inspir": 112, "dennybritz": 112, "blob": 112, "cliff_walk": 112, "latter": 112, "current_row": [112, 113], "nrow": [112, 113], "current_col": [112, 113], "col": [112, 113], "47": 112, "proabil": [112, 114], "slipperi": 113, "extent": 113, "4x4": 113, "perpendicular": 113, "is_slipperi": 113, "stool": 113, "franuka": 113, "itch": 113, "io": 113, "rpg": 113, "snow": 113, "tileset": 113, "mel": 113, "tilleri": 113, "cyaneu": 113, "ncol": [113, 116], "time_limit": [113, 114], "8x8": 113, "desc": 113, "map_nam": 113, "preload": 113, "sfff": 113, "fhfh": 113, "fffh": 113, "hffg": 113, "generate_random_map": 113, "toy_text": [113, 116], "frozen_lak": 113, "sfffffff": 113, "ffffffff": 113, "fffhffff": 113, "fffffhff": 113, "fhhfffhf": 113, "fhffhfhf": 113, "fffhfffg": 113, "bug": 113, "passeng": 114, "yellow": 114, "5x5": 114, "maxq": 114, "decomposit": 114, "tom": 114, "dietterich": 114, "pickup": 114, "south": 114, "north": 114, "east": 114, "west": 114, "letter": 114, "taxi_row": 114, "taxi_col": 114, "passenger_loc": 114, "404": 114, "reachabl": 114, "illeg": 114, "action_mask": 114, "fickl": 114, "Or": 114, "argmax": [114, 116], "q_valu": [114, 116], "pp": 114, "227": 114, "303": 114, "nov": 114, "doi": 114, "1613": 114, "639": 114, "cleaner": 114, "disallow": 114, "loc": 114, "passidx": 114, "maintain": 115, "capabl": 115, "insert": [115, 119], "casino": 116, "infam": 116, "beatabl": 116, "won": 116, "viabl": 116, "strategi": 116, "favorit": 116, "zemann": 116, "__future__": [116, 119], "annot": [116, 119], "defaultdict": 116, "pyplot": [116, 119], "plt": [116, 119], "seaborn": [116, 119], "sn": [116, 119], "patch": 116, "tqdm": 116, "explanatori": 116, "tell": [116, 118], "idea": [116, 118], "slow": 116, "showcas": 116, "respond": 116, "harm": 116, "greedi": 116, "blackjackag": 116, "learning_r": [116, 119], "initial_epsilon": 116, "epsilon_decai": 116, "final_epsilon": 116, "discount_factor": 116, "95": 116, "arg": [116, 119], "decai": 116, "lr": [116, 119], "training_error": 116, "get_act": 116, "greedili": 116, "exploit": 116, "next_ob": [116, 119], "future_q_valu": 116, "temporal_differ": 116, "decay_epsilon": 116, "readi": 116, "n_episod": 116, "100_000": 116, "start_epsilon": 116, "decent": [116, 119], "converg": 116, "10x": 116, "rolling_length": 116, "fig": 116, "subplot": 116, "figsiz": [116, 119], "set_titl": 116, "reward_moving_averag": 116, "convolv": 116, "length_moving_averag": 116, "training_error_moving_averag": 116, "tight_layout": 116, "create_grid": 116, "usable_ac": 116, "state_valu": 116, "action_valu": 116, "player_count": 116, "dealer_count": 116, "meshgrid": 116, "arang": 116, "apply_along_axi": 116, "arr": 116, "dstack": 116, "value_grid": 116, "policy_grid": 116, "create_plot": 116, "figaspect": 116, "suptitl": 116, "fontsiz": 116, "ax1": 116, "add_subplot": 116, "plot_surfac": 116, "rstride": 116, "cstride": 116, "cmap": 116, "viridi": 116, "edgecolor": 116, "xtick": 116, "ytick": 116, "set_xlabel": 116, "set_ylabel": 116, "zaxi": 116, "set_rotate_label": 116, "set_zlabel": 116, "view_init": 116, "220": 116, "ax2": 116, "heatmap": 116, "linewidth": 116, "accent_r": 116, "cbar": 116, "set_xticklabel": 116, "set_yticklabel": 116, "legend": 116, "legend_el": 116, "facecolor": 116, "lightgreen": 116, "label": 116, "grei": 116, "bbox_to_anchor": 116, "fig1": 116, "fig2": 116, "hopefulli": 116, "grip": 116, "challeng": 116, "mont": [116, 119], "carlo": [116, 119], "fun": [116, 119], "blackjack_tutori": 116, "ipynb": [116, 117, 118, 119], "overview": [117, 119], "virtual": 117, "git": 117, "venv": 117, "bin": 117, "concern": [117, 119], "readm": 117, "setup": 117, "gym_exampl": 117, "grid_world": 117, "relative_posit": 117, "reacher_weighted_reward": 117, "discrete_act": 117, "clip_reward": 117, "illustr": [117, 118], "simplist": 117, "gridworldenv": 117, "piec": 117, "abstract": 117, "window_s": 117, "512": 117, "_action_to_direct": 117, "assert": 117, "clock": 117, "_get_ob": 117, "mandatori": 117, "_agent_loc": 117, "_target_loc": 117, "manhattan": 117, "_get_info": 117, "oftentim": 117, "worri": 117, "coincid": 117, "earlier": 117, "array_equ": 117, "_render_fram": 117, "trivial": 117, "skeleton": 117, "set_mod": 117, "canva": 117, "pix_square_s": 117, "rect": 117, "gridlin": 117, "width": 117, "visibl": 117, "blit": 117, "get_rect": 117, "pump": 117, "delai": 117, "stabl": 117, "tick": 117, "surfarrai": 117, "pixels3d": 117, "bother": 117, "detect": 117, "put": 117, "registr": 117, "appropri": [117, 119], "entrypoint": 117, "mere": 117, "third": 117, "parti": 117, "codebas": 117, "edit": 117, "setuptool": 117, "install_requir": 117, "local": 117, "perfectli": 117, "fine": 117, "did": 118, "failur": 118, "notabl": 118, "inher": 118, "preserv": 118, "obviou": 118, "forev": 118, "forcibli": 118, "halt": 118, "formal": 118, "q_": 118, "o_t": 118, "a_t": 118, "r_t": 118, "max_a": 118, "o_": 118, "a_": 118, "q_target": 118, "distinct": 118, "frequent": 118, "differenti": 118, "vf_target": 118, "vf_next_stat": 118, "onward": 118, "handling_time_limit": 118, "scratch": 119, "earliest": 119, "gradient": 119, "burden": 119, "maxim": 119, "inverted_pendulum": 119, "1d": 119, "panda": 119, "pd": 119, "nn": 119, "rcparam": 119, "parameter": 119, "policy_network": 119, "obs_space_dim": 119, "action_space_dim": 119, "hidden_space1": 119, "feel": 119, "hidden_space2": 119, "shared_net": 119, "sequenti": 119, "policy_mean_net": 119, "std": 119, "policy_stddev_net": 119, "tensor": 119, "action_mean": 119, "action_stddev": 119, "shared_featur": 119, "exp": 119, "mention": 119, "fact": 119, "reinfroc": 119, "acronym": 119, "ward": 119, "ncrement": 119, "actor": 119, "o": 119, "ffset": 119, "einforc": 119, "haracterist": 119, "ligibl": 119, "tune": 119, "ep": 119, "mathemat": 119, "prob": 119, "adamw": 119, "sample_act": 119, "distrib": 119, "log_prob": 119, "running_g": 119, "delta": 119, "zip": 119, "zero_grad": 119, "centric": 119, "reiniti": 119, "fairli": 119, "brittl": 119, "spinningup": 119, "en": 119, "html": 119, "total_num_episod": 119, "5e3": 119, "rewards_over_se": 119, "fibonacci": 119, "manual_se": 119, "reward_over_episod": 119, "avg_reward": 119, "rewards_to_plot": 119, "df1": 119, "datafram": 119, "melt": 119, "renam": 119, "inplac": 119, "darkgrid": 119, "talk": 119, "palett": 119, "rainbow": 119, "lineplot": 119, "siddarth": 119, "chandrasekar": 119, "ronald": 119, "connectionist": 119, "machin": 119, "2004": 119, "229": 119, "256": 119, "reinforce_invpend_gym_v26": 119}, "objects": {"Space": [[9, 0, 1, "", "dtype"]], "": [[15, 1, 1, "", "action_space"], [15, 1, 1, "", "observation_space"], [15, 1, 1, "", "single_action_space"], [15, 1, 1, "", "single_observation_space"]], "gymnasium": [[17, 2, 1, "", "ActionWrapper"], [2, 2, 1, "", "Env"], [19, 2, 1, "", "ObservationWrapper"], [20, 2, 1, "", "RewardWrapper"], [16, 2, 1, "", "Wrapper"], [8, 3, 1, "", "make"], [8, 3, 1, "", "pprint_registry"], [8, 3, 1, "", "register"], [8, 3, 1, "", "spec"]], "gymnasium.ActionWrapper.ActionWrapper": [[17, 3, 1, "", "action"]], "gymnasium.Env": [[2, 1, 1, "", "action_space"], [2, 3, 1, "", "close"], [2, 1, 1, "", "metadata"], [2, 0, 1, "", "np_random"], [2, 1, 1, "", "observation_space"], [2, 3, 1, "", "render"], [2, 1, 1, "", "render_mode"], [2, 3, 1, "", "reset"], [2, 1, 1, "", "reward_range"], [2, 1, 1, "", "spec"], [2, 3, 1, "", "step"], [2, 0, 1, "", "unwrapped"]], "gymnasium.ObservationWrapper": [[19, 3, 1, "", "observation"]], "gymnasium.RewardWrapper.RewardWrapper": [[20, 3, 1, "", "reward"]], "gymnasium.Wrapper": [[16, 0, 1, "", "action_space"], [16, 3, 1, "", "close"], [16, 0, 1, "", "metadata"], [16, 0, 1, "", "np_random"], [16, 0, 1, "", "observation_space"], [16, 3, 1, "", "reset"], [16, 0, 1, "", "reward_range"], [16, 0, 1, "", "spec"], [16, 3, 1, "", "step"], [16, 0, 1, "", "unwrapped"]], "gymnasium.experimental": [[4, 2, 1, "", "FuncEnv"]], "gymnasium.experimental.FuncEnv": [[4, 3, 1, "id0", "initial"], [4, 3, 1, "id1", "observation"], [4, 3, 1, "", "render_close"], [4, 3, 1, "", "render_image"], [4, 3, 1, "", "render_init"], [4, 3, 1, "", "reward"], [4, 3, 1, "", "state_info"], [4, 3, 1, "", "step_info"], [4, 3, 1, "", "terminal"], [4, 3, 1, "", "transform"], [4, 3, 1, "", "transition"]], "gymnasium.experimental.wrappers": [[7, 2, 1, "", "ClipRewardV0"], [7, 2, 1, "", "LambdaActionV0"], [7, 2, 1, "", "LambdaObservationV0"], [7, 2, 1, "", "LambdaRewardV0"]], "gymnasium.spaces": [[11, 2, 1, "", "Box"], [10, 2, 1, "", "Dict"], [11, 2, 1, "", "Discrete"], [10, 2, 1, "", "Graph"], [11, 2, 1, "", "MultiBinary"], [11, 2, 1, "", "MultiDiscrete"], [10, 2, 1, "", "Sequence"], [9, 2, 1, "", "Space"], [11, 2, 1, "", "Text"], [10, 2, 1, "", "Tuple"]], "gymnasium.spaces.Box": [[11, 4, 1, "", "is_bounded"], [11, 4, 1, "", "sample"], [11, 4, 1, "", "seed"]], "gymnasium.spaces.Dict": [[10, 4, 1, "", "sample"], [10, 4, 1, "", "seed"]], "gymnasium.spaces.Discrete": [[11, 4, 1, "", "sample"], [11, 4, 1, "", "seed"]], "gymnasium.spaces.Graph": [[10, 4, 1, "", "sample"], [10, 4, 1, "", "seed"]], "gymnasium.spaces.MultiBinary": [[11, 4, 1, "", "sample"], [11, 4, 1, "", "seed"]], "gymnasium.spaces.MultiDiscrete": [[11, 4, 1, "", "sample"], [11, 4, 1, "", "seed"]], "gymnasium.spaces.Sequence": [[10, 4, 1, "", "sample"], [10, 4, 1, "", "seed"]], "gymnasium.spaces.Text": [[11, 4, 1, "", "sample"], [11, 4, 1, "", "seed"]], "gymnasium.spaces.Tuple": [[10, 4, 1, "", "sample"], [10, 4, 1, "", "seed"]], "gymnasium.spaces.space.Space": [[9, 3, 1, "", "contains"], [9, 3, 1, "", "from_jsonable"], [9, 3, 1, "", "sample"], [9, 3, 1, "", "seed"], [9, 0, 1, "", "shape"], [9, 3, 1, "", "to_jsonable"]], "gymnasium.spaces.utils": [[12, 3, 1, "", "flatdim"], [12, 3, 1, "", "flatten"], [12, 3, 1, "", "flatten_space"], [12, 3, 1, "", "unflatten"]], "gymnasium.utils.env_checker": [[14, 3, 1, "", "check_env"]], "gymnasium.utils.play": [[14, 2, 1, "", "PlayPlot"], [14, 2, 1, "", "PlayableGame"], [14, 3, 1, "", "play"]], "gymnasium.utils.play.PlayPlot": [[14, 4, 1, "", "callback"]], "gymnasium.utils.play.PlayableGame": [[14, 4, 1, "", "process_event"]], "gymnasium.utils.save_video": [[14, 3, 1, "", "capped_cubic_video_schedule"], [14, 3, 1, "", "save_video"]], "gymnasium.utils.seeding": [[14, 3, 1, "", "np_random"]], "gymnasium.utils.step_api_compatibility": [[14, 3, 1, "", "convert_to_done_step_api"], [14, 3, 1, "", "convert_to_terminated_truncated_step_api"], [14, 3, 1, "", "step_api_compatibility"]], "gymnasium.vector": [[15, 2, 1, "", "AsyncVectorEnv"], [15, 2, 1, "", "SyncVectorEnv"], [15, 2, 1, "", "VectorEnv"], [15, 3, 1, "", "make"]], "gymnasium.vector.VectorEnv": [[15, 4, 1, "", "close"], [15, 4, 1, "", "reset"], [15, 4, 1, "", "step"]], "gymnasium.vector.utils": [[13, 3, 1, "", "batch_space"], [13, 3, 1, "", "concatenate"], [13, 3, 1, "", "create_empty_array"], [13, 3, 1, "", "create_shared_memory"], [13, 3, 1, "", "iterate"], [13, 3, 1, "", "read_from_shared_memory"], [13, 3, 1, "", "write_to_shared_memory"]], "gymnasium.wrappers": [[18, 2, 1, "", "AtariPreprocessing"], [18, 2, 1, "", "AutoResetWrapper"], [17, 2, 1, "", "ClipAction"], [18, 2, 1, "", "EnvCompatibility"], [19, 2, 1, "", "FilterObservation"], [19, 2, 1, "", "FlattenObservation"], [19, 2, 1, "", "FrameStack"], [19, 2, 1, "", "GrayScaleObservation"], [18, 2, 1, "", "HumanRendering"], [19, 2, 1, "", "NormalizeObservation"], [20, 2, 1, "", "NormalizeReward"], [18, 2, 1, "", "OrderEnforcing"], [18, 2, 1, "", "PassiveEnvChecker"], [19, 2, 1, "", "PixelObservationWrapper"], [18, 2, 1, "", "RecordEpisodeStatistics"], [18, 2, 1, "", "RecordVideo"], [18, 2, 1, "", "RenderCollection"], [17, 2, 1, "", "RescaleAction"], [19, 2, 1, "", "ResizeObservation"], [18, 2, 1, "", "StepAPICompatibility"], [19, 2, 1, "", "TimeAwareObservation"], [18, 2, 1, "", "TimeLimit"], [19, 2, 1, "", "TransformObservation"], [20, 2, 1, "", "TransformReward"], [18, 2, 1, "", "VectorListInfo"]]}, "objtypes": {"0": "py:property", "1": "py:attribute", "2": "py:class", "3": "py:function", "4": "py:method"}, "objnames": {"0": ["py", "property", "Python property"], "1": ["py", "attribute", "Python attribute"], "2": ["py", "class", "Python class"], "3": ["py", "function", "Python function"], "4": ["py", "method", "Python method"]}, "titleterms": {"404": 0, "page": [0, 1], "Not": 0, "found": 0, "The": 0, "request": 0, "could": 0, "gymnasium": [1, 2, 4, 5, 15, 16, 115, 117], "doc": 1, "instruct": 1, "modifi": [1, 21], "environ": [1, 2, 3, 4, 5, 6, 8, 14, 15, 18, 21, 22, 23, 109, 115, 116, 117], "edit": 1, "an": [1, 116, 119], "ad": 1, "new": [1, 14], "atari": [1, 18, 24, 43], "env": [1, 2, 15, 109, 117], "non": 1, "other": [1, 109], "step": [1, 14, 22, 23, 117], "build": [1, 116, 119], "document": 1, "write": 1, "tutori": 1, "method": [2, 9, 15, 16], "attribut": [2, 9, 15, 16], "addit": 2, "implement": [2, 16], "experiment": [3, 4, 5], "function": [3, 4], "wrapper": [3, 6, 7, 16, 17, 18, 19, 20, 117], "lambda": [3, 6, 7], "observ": [3, 6, 7, 19, 21, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 89, 90, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 112, 113, 114, 116, 117], "action": [3, 6, 7, 17, 21, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 89, 90, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 112, 113, 114, 116], "reward": [3, 6, 7, 20, 24, 27, 28, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 88, 89, 90, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 112, 113, 114], "common": [3, 6, 7, 24], "vector": [3, 5, 6, 9, 13, 15, 18], "onli": [3, 6], "funcenv": 4, "func2env": 4, "functionaljaxcompatibilityenv": 4, "vectorenv": [5, 15], "asyncvectorenv": 5, "syncvectorenv": 5, "custom": [5, 16, 117], "envpool": 5, "registri": 8, "make": [8, 15, 117], "regist": [8, 117], "all": 8, "spec": 8, "pretti": 8, "print": 8, "space": [9, 10, 11, 12, 13, 21, 24, 50, 51, 52, 53, 54, 88, 89, 90, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 112, 113, 114], "fundament": [9, 11], "composit": [9, 10], "util": [9, 12, 13, 14], "dict": 10, "tupl": 10, "sequenc": 10, "graph": 10, "box": [11, 38], "discret": [11, 109], "multibinari": 11, "multidiscret": 11, "text": [11, 110], "share": 13, "memori": 13, "visual": [14, 116], "save": 14, "render": [14, 18, 23, 117], "video": [14, 18, 84, 109], "old": 14, "api": [14, 22, 115], "compat": [14, 18, 22], "seed": [14, 23], "check": 14, "async": 15, "sync": 15, "clip": 17, "rescal": 17, "misc": 18, "preprocess": 18, "autoreset": 18, "passiv": 18, "checker": 18, "human": 18, "order": 18, "enforc": 18, "record": 18, "episod": [18, 88, 89, 90, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 112, 113, 114], "statist": 18, "collect": [18, 115], "time": [18, 19, 118], "limit": [18, 118], "list": [18, 43], "info": 18, "transform": [19, 20], "filter": 19, "flatten": 19, "framestack": 19, "grai": 19, "scale": 19, "normal": [19, 20], "pixel": 19, "resiz": 19, "awar": 19, "basic": 21, "usag": 21, "initi": [21, 117], "interact": 21, "explain": 21, "code": [21, 23, 118], "more": 21, "inform": [21, 111, 112, 113, 114], "gym": [22, 109], "load": 22, "openai": [22, 109], "v0": 22, "22": 22, "v21": 23, "v26": 23, "migrat": 23, "guid": 23, "exampl": 23, "random": 23, "number": 23, "gener": 23, "reset": [23, 89, 117], "remov": 23, "autorom": 24, "instal": 24, "rom": 24, "stochast": 24, "argument": [24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 89, 90, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 112, 113, 114], "version": [24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 89, 90, 92, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 111, 112, 113, 114], "histori": [24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 89, 90, 92, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 112, 113, 114], "name": [24, 64], "scheme": 24, "flavor": 24, "refer": [24, 89, 92, 111, 112, 114, 115, 119], "adventur": 25, "descript": [25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 89, 90, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 112, 113, 114], "air": 26, "raid": 26, "alien": 27, "amidar": 28, "assault": 29, "asterix": 30, "asteroid": 31, "atlanti": 32, "bank": 33, "heist": 33, "battl": 34, "zone": 34, "beam": 35, "rider": 35, "berzerk": 36, "bowl": 37, "breakout": 39, "carniv": 40, "centiped": 41, "chopper": 42, "command": 42, "complet": 43, "crazi": 44, "climber": 44, "defend": 45, "demon": 46, "attack": 46, "doubl": [47, 103], "dunk": 47, "elev": 48, "enduro": 49, "fishingderbi": 50, "freewai": 51, "frostbit": 52, "gopher": 53, "gravitar": 54, "hero": 55, "icehockei": 56, "jamesbond": 57, "journeyescap": 58, "kangaroo": 59, "krull": 60, "kung": 61, "fu": 61, "master": 61, "montezuma": 62, "reveng": 62, "m": 63, "pacman": 63, "thi": 64, "game": [64, 109], "phoenix": 65, "pitfal": 66, "pong": 67, "pooyan": 68, "privateey": 69, "qbert": 70, "riverraid": 71, "road": 72, "runner": 72, "robot": [73, 109], "tank": 73, "seaquest": 74, "ski": 75, "solari": 76, "spaceinvad": 77, "stargunn": 78, "tenni": 79, "timepilot": 80, "tutankham": 81, "up": 82, "n": 82, "down": 82, "ventur": 83, "pinbal": 84, "wizard": 85, "wor": 85, "zaxxon": 86, "box2d": 87, "biped": 88, "walker": 88, "start": [88, 89, 90, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 112, 113, 114], "state": [88, 89, 90, 92, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 112, 113, 114, 117], "termin": [88, 89, 90, 118], "credit": [88, 89, 90], "car": [89, 94, 95], "race": [89, 109], "lunar": 90, "lander": 90, "classic": [91, 109], "control": [91, 109], "acrobot": 92, "end": [92, 93, 94, 95, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 111, 112, 113, 114], "cart": 93, "pole": 93, "mountain": [94, 95], "transit": [94, 95], "dynam": [94, 95, 109], "continu": 95, "pendulum": [96, 103, 104], "truncat": [96, 118], "mujoco": [97, 119], "ant": 98, "half": 99, "cheetah": 99, "hopper": 100, "humanoid": [101, 102], "standup": 102, "invert": [103, 104], "pusher": 105, "reacher": 106, "swimmer": 107, "note": 107, "walker2d": 108, "third": 109, "parti": 109, "stabl": 109, "retro": 109, "maintain": 109, "flappi": 109, "bird": 109, "A": 109, "derk": 109, "gpu": 109, "acceler": 109, "moba": 109, "slimevolleygym": 109, "simpl": 109, "singl": 109, "multi": 109, "agent": [109, 116, 119], "reinforc": [109, 115, 119], "learn": [109, 115, 116, 118, 119], "uniti": 109, "ml": 109, "engin": 109, "pge": 109, "parallel": 109, "jimini": 109, "train": [109, 116, 119], "pybullet": 109, "drone": 109, "quadcopt": 109, "marsexplor": 109, "mar": 109, "panda": 109, "us": [109, 117, 119], "physic": 109, "robo": 109, "real": 109, "world": 109, "simul": 109, "offworld": 109, "safe": 109, "softrobot": 109, "soft": 109, "igibson": 109, "dexteroushand": 109, "dual": 109, "dexter": 109, "hand": 109, "manipul": 109, "task": 109, "omniisaacgymenv": 109, "autonom": 109, "drive": 109, "sumo": 109, "rl": 109, "duckietown": 109, "electr": 109, "motor": 109, "highwai": 109, "commonroad": 109, "tmrl": 109, "trackmania": 109, "2020": 109, "through": 109, "racing_dream": 109, "l2r": 109, "multimod": 109, "where": 109, "how": 109, "racecar_gym": 109, "compilergym": 109, "optimis": 109, "compil": 109, "carl": 109, "context": 109, "adapt": 109, "matrix": 109, "mdp": 109, "easili": 109, "creat": [109, 117], "mo": 109, "object": 109, "cellular": 109, "automata": 109, "sokoban": 109, "2d": 109, "transport": 109, "puzzl": 109, "dacbench": 109, "benchmark": 109, "librari": 109, "algorithm": 109, "configur": 109, "nlpgym": 109, "toolkit": 109, "develop": 109, "solv": [109, 116], "nlp": 109, "satur": 109, "prove": 109, "theorem": 109, "shinrl": 109, "evalu": 109, "gymnax": 109, "hardwar": 109, "anytrad": 109, "financi": 109, "trade": 109, "forex": 109, "stock": 109, "mtsim": 109, "metatrad": 109, "5": 109, "platform": 109, "openmodelica": 109, "microgrid": 109, "power": 109, "electron": 109, "convert": 109, "mobil": 109, "coordin": 109, "wireless": 109, "network": [109, 119], "gymfc": 109, "flight": 109, "tune": 109, "framework": 109, "toi": 110, "blackjack": [111, 116], "cliff": 112, "walk": 112, "frozen": 113, "lake": 113, "taxi": 114, "i": 115, "standard": 115, "divers": 115, "q": 116, "import": [116, 118], "setup": 116, "execut": 116, "visualis": 116, "polici": [116, 119], "think": 116, "you": 116, "can": 116, "do": 116, "better": 116, "your": 117, "own": 117, "subclass": 117, "declar": 117, "construct": 117, "from": 117, "close": 117, "packag": 117, "instanc": 117, "handl": 118, "solut": 118, "plot": 119, "curv": 119}, "envversion": {"sphinx.domains.c": 2, "sphinx.domains.changeset": 1, "sphinx.domains.citation": 1, "sphinx.domains.cpp": 8, "sphinx.domains.index": 1, "sphinx.domains.javascript": 2, "sphinx.domains.math": 2, "sphinx.domains.python": 3, "sphinx.domains.rst": 2, "sphinx.domains.std": 2, "sphinx": 57}, "alltitles": {"404 - Page Not Found": [[0, "page-not-found"]], "The requested page could not be found.": [[0, "the-requested-page-could-not-be-found"]], "Gymnasium-docs": [[1, "gymnasium-docs"]], "Instructions for modifying environment pages": [[1, "instructions-for-modifying-environment-pages"]], "Editing an environment page": [[1, "editing-an-environment-page"]], "Adding a new environment": [[1, "adding-a-new-environment"]], "Atari env": [[1, "atari-env"]], "Non-Atari env": [[1, "non-atari-env"]], "Other steps": [[1, "other-steps"]], "Build the Documentation": [[1, "build-the-documentation"]], "Writing Tutorials": [[1, "writing-tutorials"]], "Env": [[2, "env"]], "gymnasium.Env": [[2, "gymnasium-env"]], "Methods": [[2, "methods"], [9, "methods"], [15, "methods"], [16, "methods"]], "Attributes": [[2, "attributes"], [9, "attributes"], [15, "attributes"], [16, "attributes"]], "Additional Methods": [[2, "additional-methods"]], "Implementing environments": [[2, "implementing-environments"]], "Experimental": [[3, "experimental"]], "Functional Environments": [[3, "functional-environments"]], "Wrappers": [[3, "wrappers"], [7, "wrappers"], [16, "wrappers"]], "Lambda Observation Wrappers": [[3, "lambda-observation-wrappers"], [7, "lambda-observation-wrappers"]], "Lambda Action Wrappers": [[3, "lambda-action-wrappers"], [7, "lambda-action-wrappers"]], "Lambda Reward Wrappers": [[3, "lambda-reward-wrappers"], [7, "lambda-reward-wrappers"]], "Common Wrappers": [[3, "common-wrappers"], [7, "common-wrappers"]], "Vector Only Wrappers": [[3, "vector-only-wrappers"], [6, "vector-only-wrappers"]], "Vector Environment": [[3, "vector-environment"]], "Wrappers for Vector Environments": [[3, "wrappers-for-vector-environments"]], "Functional Environment": [[4, "functional-environment"]], "gymnasium.experimental.FuncEnv": [[4, "gymnasium-experimental-funcenv"]], "gymnasium.experimental.func2env.FunctionalJaxCompatibilityEnv": [[4, "gymnasium-experimental-func2env-functionaljaxcompatibilityenv"]], "Vectorizing Environment": [[5, "vectorizing-environment"]], "gymnasium.experimental.VectorEnv": [[5, "gymnasium-experimental-vectorenv"]], "gymnasium.experimental.vector.AsyncVectorEnv": [[5, "gymnasium-experimental-vector-asyncvectorenv"]], "gymnasium.experimental.vector.SyncVectorEnv": [[5, "gymnasium-experimental-vector-syncvectorenv"]], "Custom Vector environments": [[5, "custom-vector-environments"]], "EnvPool": [[5, "envpool"]], "Vector Environment Wrappers": [[6, "vector-environment-wrappers"]], "Vector Lambda Observation Wrappers": [[6, "vector-lambda-observation-wrappers"]], "Vector Lambda Action Wrappers": [[6, "vector-lambda-action-wrappers"]], "Vector Lambda Reward Wrappers": [[6, "vector-lambda-reward-wrappers"]], "Vector Common Wrappers": [[6, "vector-common-wrappers"]], "Registry": [[8, "registry"]], "Make": [[8, "make"]], "Register": [[8, "register"]], "All registered environments": [[8, "all-registered-environments"]], "Spec": [[8, "spec"]], "Pretty print registry": [[8, "pretty-print-registry"]], "Spaces": [[9, "spaces"]], "Fundamental Spaces": [[9, "fundamental-spaces"], [11, "fundamental-spaces"]], "Composite Spaces": [[9, "composite-spaces"], [10, "composite-spaces"]], "Utils": [[9, "utils"], [14, "utils"]], "Vector Utils": [[9, "vector-utils"]], "Dict": [[10, "dict"]], "Tuple": [[10, "tuple"]], "Sequence": [[10, "sequence"]], "Graph": [[10, "graph"]], "Box": [[11, "box"]], "Discrete": [[11, "discrete"]], "MultiBinary": [[11, "multibinary"]], "MultiDiscrete": [[11, "multidiscrete"]], "Text": [[11, "text"]], "Spaces Utils": [[12, "spaces-utils"]], "Spaces Vector Utils": [[13, "spaces-vector-utils"]], "Shared Memory Utils": [[13, "shared-memory-utils"]], "Visualization": [[14, "visualization"]], "Save Rendering Videos": [[14, "save-rendering-videos"]], "Old to New Step API Compatibility": [[14, "old-to-new-step-api-compatibility"]], "Seeding": [[14, "seeding"]], "Environment Checking": [[14, "environment-checking"]], "Vector": [[15, "vector"]], "Gymnasium.vector.VectorEnv": [[15, "gymnasium-vector-vectorenv"]], "Making Vector Environments": [[15, "making-vector-environments"]], "Async Vector Env": [[15, "async-vector-env"]], "Sync Vector Env": [[15, "sync-vector-env"]], "gymnasium.Wrapper": [[16, "gymnasium-wrapper"]], "Gymnasium Wrappers": [[16, "gymnasium-wrappers"]], "Implementing a custom wrapper": [[16, "implementing-a-custom-wrapper"]], "Action Wrappers": [[17, "action-wrappers"]], "Action Wrapper": [[17, "action-wrapper"]], "Clip Action": [[17, "clip-action"]], "Rescale Action": [[17, "rescale-action"]], "Misc Wrappers": [[18, "misc-wrappers"]], "Atari Preprocessing": [[18, "atari-preprocessing"]], "Autoreset": [[18, "autoreset"]], "Compatibility": [[18, "compatibility"]], "Passive Environment Checker": [[18, "passive-environment-checker"]], "Human Rendering": [[18, "human-rendering"]], "Order Enforcing": [[18, "order-enforcing"]], "Record Episode Statistics": [[18, "record-episode-statistics"]], "Record Video": [[18, "record-video"]], "Render Collection": [[18, "render-collection"]], "Time Limit": [[18, "time-limit"]], "Vector List Info": [[18, "vector-list-info"]], "Observation Wrappers": [[19, "observation-wrappers"]], "Observation Wrapper": [[19, "observation-wrapper"]], "Transform Observation": [[19, "transform-observation"]], "Filter Observation": [[19, "filter-observation"]], "Flatten Observation": [[19, "flatten-observation"]], "Framestack Observations": [[19, "framestack-observations"]], "Gray Scale Observation": [[19, "gray-scale-observation"]], "Normalize Observation": [[19, "normalize-observation"]], "Pixel Observation Wrapper": [[19, "pixel-observation-wrapper"]], "Resize Observation": [[19, "resize-observation"]], "Time Aware Observation": [[19, "time-aware-observation"]], "Reward Wrappers": [[20, "reward-wrappers"]], "Reward Wrapper": [[20, "reward-wrapper"]], "Transform Reward": [[20, "transform-reward"]], "Normalize Reward": [[20, "normalize-reward"]], "Basic Usage": [[21, "basic-usage"]], "Initializing Environments": [[21, "initializing-environments"]], "Interacting with the Environment": [[21, "interacting-with-the-environment"]], "Explaining the code": [[21, "explaining-the-code"]], "Action and observation spaces": [[21, "action-and-observation-spaces"]], "Modifying the environment": [[21, "modifying-the-environment"]], "More information": [[21, "more-information"]], "Compatibility with Gym": [[22, "compatibility-with-gym"]], "Loading OpenAI Gym environments": [[22, "loading-openai-gym-environments"]], "Gym v0.22 Environment Compatibility": [[22, "gym-v0-22-environment-compatibility"]], "Step API Compatibility": [[22, "step-api-compatibility"]], "v21 to v26 Migration Guide": [[23, "v21-to-v26-migration-guide"]], "Example code for v21": [[23, "example-code-for-v21"]], "Example code for v26": [[23, "example-code-for-v26"]], "Seed and random number generator": [[23, "seed-and-random-number-generator"]], "Environment Reset": [[23, "environment-reset"]], "Environment Step": [[23, "environment-step"]], "Environment Render": [[23, "environment-render"]], "Removed code": [[23, "removed-code"]], "Atari": [[24, "atari"]], "AutoROM (installing the ROMs)": [[24, "autorom-installing-the-roms"]], "Action Space": [[24, "action-space"], [50, "action-space"], [51, "action-space"], [52, "action-space"], [53, "action-space"], [54, "action-space"], [88, "action-space"], [89, "action-space"], [90, "action-space"], [92, "action-space"], [93, "action-space"], [94, "action-space"], [95, "action-space"], [96, "action-space"], [98, "action-space"], [99, "action-space"], [100, "action-space"], [101, "action-space"], [102, "action-space"], [103, "action-space"], [104, "action-space"], [105, "action-space"], [106, "action-space"], [107, "action-space"], [108, "action-space"], [111, "action-space"], [112, "action-space"], [113, "action-space"], [114, "action-space"]], "Observation Space": [[24, "observation-space"], [88, "observation-space"], [89, "observation-space"], [90, "observation-space"], [92, "observation-space"], [93, "observation-space"], [94, "observation-space"], [95, "observation-space"], [96, "observation-space"], [98, "observation-space"], [99, "observation-space"], [100, "observation-space"], [101, "observation-space"], [102, "observation-space"], [103, "observation-space"], [104, "observation-space"], [105, "observation-space"], [106, "observation-space"], [107, "observation-space"], [108, "observation-space"], [111, "observation-space"], [112, "observation-space"], [113, "observation-space"], [114, "observation-space"]], "Rewards": [[24, "rewards"], [27, "rewards"], [28, "rewards"], [30, "rewards"], [31, "rewards"], [32, "rewards"], [33, "rewards"], [34, "rewards"], [35, "rewards"], [36, "rewards"], [37, "rewards"], [38, "rewards"], [39, "rewards"], [40, "rewards"], [41, "rewards"], [42, "rewards"], [44, "rewards"], [45, "rewards"], [46, "rewards"], [47, "rewards"], [48, "rewards"], [49, "rewards"], [50, "rewards"], [51, "rewards"], [52, "rewards"], [53, "rewards"], [54, "rewards"], [55, "rewards"], [56, "rewards"], [57, "rewards"], [58, "rewards"], [59, "rewards"], [60, "rewards"], [66, "rewards"], [67, "rewards"], [68, "rewards"], [69, "rewards"], [70, "rewards"], [71, "rewards"], [72, "rewards"], [73, "rewards"], [74, "rewards"], [75, "rewards"], [76, "rewards"], [77, "rewards"], [78, "rewards"], [79, "rewards"], [80, "rewards"], [88, "rewards"], [89, "rewards"], [90, "rewards"], [92, "rewards"], [93, "rewards"], [96, "rewards"], [98, "rewards"], [99, "rewards"], [100, "rewards"], [101, "rewards"], [102, "rewards"], [103, "rewards"], [104, "rewards"], [105, "rewards"], [106, "rewards"], [107, "rewards"], [108, "rewards"], [111, "rewards"], [113, "rewards"], [114, "rewards"]], "Stochasticity": [[24, "stochasticity"]], "Common Arguments": [[24, "common-arguments"]], "Version History and Naming Schemes": [[24, "version-history-and-naming-schemes"]], "Flavors": [[24, "flavors"]], "References": [[24, "references"], [89, "references"], [92, "references"], [111, "references"], [112, "references"], [114, "references"], [119, "references"]], "Adventure": [[25, "adventure"]], "Description": [[25, "description"], [26, "description"], [27, "description"], [28, "description"], [29, "description"], [30, "description"], [31, "description"], [32, "description"], [33, "description"], [34, "description"], [35, "description"], [36, "description"], [37, "description"], [38, "description"], [39, "description"], [40, "description"], [41, "description"], [42, "description"], [44, "description"], [45, "description"], [46, "description"], [47, "description"], [48, "description"], [49, "description"], [50, "description"], [51, "description"], [52, "description"], [53, "description"], [54, "description"], [55, "description"], [56, "description"], [57, "description"], [58, "description"], [59, "description"], [60, "description"], [61, "description"], [62, "description"], [63, "description"], [64, "description"], [65, "description"], [66, "description"], [67, "description"], [68, "description"], [69, "description"], [70, "description"], [71, "description"], [72, "description"], [73, "description"], [74, "description"], [75, "description"], [76, "description"], [77, "description"], [78, "description"], [79, "description"], [80, "description"], [81, "description"], [82, "description"], [83, "description"], [84, "description"], [85, "description"], [86, "description"], [88, "description"], [89, "description"], [90, "description"], [92, "description"], [93, "description"], [94, "description"], [95, "description"], [96, "description"], [98, "description"], [99, "description"], [100, "description"], [101, "description"], [102, "description"], [103, "description"], [104, "description"], [105, "description"], [106, "description"], [107, "description"], [108, "description"], [111, "description"], [112, "description"], [113, "description"], [114, "description"]], "Actions": [[25, "actions"], [26, "actions"], [27, "actions"], [28, "actions"], [29, "actions"], [30, "actions"], [31, "actions"], [32, "actions"], [33, "actions"], [34, "actions"], [35, "actions"], [36, "actions"], [37, "actions"], [38, "actions"], [39, "actions"], [40, "actions"], [41, "actions"], [42, "actions"], [44, "actions"], [45, "actions"], [46, "actions"], [47, "actions"], [48, "actions"], [49, "actions"], [55, "actions"], [56, "actions"], [57, "actions"], [58, "actions"], [59, "actions"], [60, "actions"], [61, "actions"], [62, "actions"], [63, "actions"], [64, "actions"], [65, "actions"], [66, "actions"], [67, "actions"], [68, "actions"], [69, "actions"], [70, "actions"], [71, "actions"], [72, "actions"], [73, "actions"], [74, "actions"], [75, "actions"], [76, "actions"], [77, "actions"], [78, "actions"], [79, "actions"], [80, "actions"], [81, "actions"], [82, "actions"], [83, "actions"], [84, "actions"], [85, "actions"], [86, "actions"]], "Observations": [[25, "observations"], [26, "observations"], [27, "observations"], [28, "observations"], [29, "observations"], [30, "observations"], [31, "observations"], [32, "observations"], [33, "observations"], [34, "observations"], [35, "observations"], [36, "observations"], [37, "observations"], [38, "observations"], [39, "observations"], [40, "observations"], [41, "observations"], [42, "observations"], [44, "observations"], [45, "observations"], [46, "observations"], [47, "observations"], [48, "observations"], [49, "observations"], [50, "observations"], [51, "observations"], [52, "observations"], [53, "observations"], [54, "observations"], [55, "observations"], [56, "observations"], [57, "observations"], [58, "observations"], [59, "observations"], [60, "observations"], [61, "observations"], [62, "observations"], [63, "observations"], [64, "observations"], [65, "observations"], [66, "observations"], [67, "observations"], [68, "observations"], [69, "observations"], [70, "observations"], [71, "observations"], [72, "observations"], [73, "observations"], [74, "observations"], [75, "observations"], [76, "observations"], [77, "observations"], [78, "observations"], [79, "observations"], [80, "observations"], [81, "observations"], [82, "observations"], [83, "observations"], [84, "observations"], [85, "observations"], [86, "observations"]], "Arguments": [[25, "arguments"], [26, "arguments"], [27, "arguments"], [28, "arguments"], [29, "arguments"], [30, "arguments"], [31, "arguments"], [32, "arguments"], [33, "arguments"], [34, "arguments"], [35, "arguments"], [36, "arguments"], [37, "arguments"], [38, "arguments"], [39, "arguments"], [40, "arguments"], [41, "arguments"], [42, "arguments"], [44, "arguments"], [45, "arguments"], [46, "arguments"], [47, "arguments"], [48, "arguments"], [49, "arguments"], [50, "arguments"], [51, "arguments"], [52, "arguments"], [53, "arguments"], [54, "arguments"], [55, "arguments"], [56, "arguments"], [57, "arguments"], [58, "arguments"], [59, "arguments"], [60, "arguments"], [61, "arguments"], [62, "arguments"], [63, "arguments"], [64, "arguments"], [65, "arguments"], [66, "arguments"], [67, "arguments"], [68, "arguments"], [69, "arguments"], [70, "arguments"], [71, "arguments"], [72, "arguments"], [73, "arguments"], [74, "arguments"], [75, "arguments"], [76, "arguments"], [77, "arguments"], [78, "arguments"], [79, "arguments"], [80, "arguments"], [81, "arguments"], [82, "arguments"], [83, "arguments"], [84, "arguments"], [85, "arguments"], [86, "arguments"], [88, "arguments"], [89, "arguments"], [90, "arguments"], [92, "arguments"], [93, "arguments"], [94, "arguments"], [95, "arguments"], [96, "arguments"], [98, "arguments"], [99, "arguments"], [100, "arguments"], [101, "arguments"], [102, "arguments"], [103, "arguments"], [104, "arguments"], [105, "arguments"], [106, "arguments"], [107, "arguments"], [108, "arguments"], [111, "arguments"], [112, "arguments"], [113, "arguments"], [114, "arguments"]], "Version History": [[25, "version-history"], [26, "version-history"], [27, "version-history"], [28, "version-history"], [29, "version-history"], [30, "version-history"], [31, "version-history"], [32, "version-history"], [33, "version-history"], [34, "version-history"], [35, "version-history"], [36, "version-history"], [37, "version-history"], [38, "version-history"], [39, "version-history"], [40, "version-history"], [41, "version-history"], [42, "version-history"], [44, "version-history"], [45, "version-history"], [46, "version-history"], [47, "version-history"], [48, "version-history"], [49, "version-history"], [50, "version-history"], [51, "version-history"], [52, "version-history"], [53, "version-history"], [54, "version-history"], [55, "version-history"], [56, "version-history"], [57, "version-history"], [58, "version-history"], [59, "version-history"], [60, "version-history"], [61, "version-history"], [62, "version-history"], [63, "version-history"], [64, "version-history"], [65, "version-history"], [66, "version-history"], [67, "version-history"], [68, "version-history"], [69, "version-history"], [70, "version-history"], [71, "version-history"], [72, "version-history"], [73, "version-history"], [74, "version-history"], [75, "version-history"], [76, "version-history"], [77, "version-history"], [78, "version-history"], [79, "version-history"], [80, "version-history"], [81, "version-history"], [82, "version-history"], [83, "version-history"], [84, "version-history"], [85, "version-history"], [86, "version-history"], [88, "version-history"], [89, "version-history"], [90, "version-history"], [92, "version-history"], [94, "version-history"], [95, "version-history"], [96, "version-history"], [98, "version-history"], [99, "version-history"], [100, "version-history"], [101, "version-history"], [102, "version-history"], [103, "version-history"], [104, "version-history"], [105, "version-history"], [106, "version-history"], [107, "version-history"], [108, "version-history"], [111, "version-history"], [112, "version-history"], [113, "version-history"], [114, "version-history"]], "Air Raid": [[26, "air-raid"]], "Alien": [[27, "alien"]], "Amidar": [[28, "amidar"]], "Assault": [[29, "assault"]], "Asterix": [[30, "asterix"]], "Asteroids": [[31, "asteroids"]], "Atlantis": [[32, "atlantis"]], "Bank Heist": [[33, "bank-heist"]], "Battle Zone": [[34, "battle-zone"]], "Beam Rider": [[35, "beam-rider"]], "Berzerk": [[36, "berzerk"]], "Bowling": [[37, "bowling"]], "Boxing": [[38, "boxing"]], "Breakout": [[39, "breakout"]], "Carnival": [[40, "carnival"]], "Centipede": [[41, "centipede"]], "Chopper Command": [[42, "chopper-command"]], "Complete List - Atari": [[43, "complete-list-atari"]], "Crazy Climber": [[44, "crazy-climber"]], "Defender": [[45, "defender"]], "Demon Attack": [[46, "demon-attack"]], "Double Dunk": [[47, "double-dunk"]], "Elevator Action": [[48, "elevator-action"]], "Enduro": [[49, "enduro"]], "FishingDerby": [[50, "fishingderby"]], "Freeway": [[51, "freeway"]], "Frostbite": [[52, "frostbite"]], "Gopher": [[53, "gopher"]], "Gravitar": [[54, "gravitar"]], "Hero": [[55, "hero"]], "IceHockey": [[56, "icehockey"]], "Jamesbond": [[57, "jamesbond"]], "JourneyEscape": [[58, "journeyescape"]], "Kangaroo": [[59, "kangaroo"]], "Krull": [[60, "krull"]], "Kung Fu Master": [[61, "kung-fu-master"]], "Montezuma Revenge": [[62, "montezuma-revenge"]], "Ms Pacman": [[63, "ms-pacman"]], "Name This Game": [[64, "name-this-game"]], "Phoenix": [[65, "phoenix"]], "Pitfall": [[66, "pitfall"]], "Pong": [[67, "pong"]], "Pooyan": [[68, "pooyan"]], "PrivateEye": [[69, "privateeye"]], "Qbert": [[70, "qbert"]], "Riverraid": [[71, "riverraid"]], "Road Runner": [[72, "road-runner"]], "Robot Tank": [[73, "robot-tank"]], "Seaquest": [[74, "seaquest"]], "Skiings": [[75, "skiings"]], "Solaris": [[76, "solaris"]], "SpaceInvaders": [[77, "spaceinvaders"]], "StarGunner": [[78, "stargunner"]], "Tennis": [[79, "tennis"]], "TimePilot": [[80, "timepilot"]], "Tutankham": [[81, "tutankham"]], "Up n\u2019 Down": [[82, "up-n-down"]], "Venture": [[83, "venture"]], "Video Pinball": [[84, "video-pinball"]], "Wizard of Wor": [[85, "wizard-of-wor"]], "Zaxxon": [[86, "zaxxon"]], "Box2D": [[87, "box2d"]], "Bipedal Walker": [[88, "bipedal-walker"]], "Starting State": [[88, "starting-state"], [89, "starting-state"], [90, "starting-state"], [92, "starting-state"], [93, "starting-state"], [94, "starting-state"], [95, "starting-state"], [96, "starting-state"], [98, "starting-state"], [99, "starting-state"], [100, "starting-state"], [101, "starting-state"], [102, "starting-state"], [103, "starting-state"], [104, "starting-state"], [105, "starting-state"], [106, "starting-state"], [107, "starting-state"], [108, "starting-state"], [111, "starting-state"], [112, "starting-state"], [113, "starting-state"], [114, "starting-state"]], "Episode Termination": [[88, "episode-termination"], [89, "episode-termination"], [90, "episode-termination"]], "Credits": [[88, "credits"], [89, "credits"], [90, "credits"]], "Car Racing": [[89, "car-racing"]], "Reset Arguments": [[89, "reset-arguments"]], "Lunar Lander": [[90, "lunar-lander"]], "Classic Control": [[91, "classic-control"]], "Acrobot": [[92, "acrobot"]], "Episode End": [[92, "episode-end"], [93, "episode-end"], [94, "episode-end"], [95, "episode-end"], [98, "episode-end"], [99, "episode-end"], [100, "episode-end"], [101, "episode-end"], [102, "episode-end"], [103, "episode-end"], [104, "episode-end"], [105, "episode-end"], [106, "episode-end"], [107, "episode-end"], [108, "episode-end"], [111, "episode-end"], [112, "episode-end"], [113, "episode-end"], [114, "episode-end"]], "Cart Pole": [[93, "cart-pole"]], "Mountain Car": [[94, "mountain-car"]], "Transition Dynamics:": [[94, "transition-dynamics"], [95, "transition-dynamics"]], "Reward:": [[94, "reward"]], "Mountain Car Continuous": [[95, "mountain-car-continuous"]], "Reward": [[95, "reward"], [112, "reward"]], "Pendulum": [[96, "pendulum"]], "Episode Truncation": [[96, "episode-truncation"]], "MuJoCo": [[97, "mujoco"]], "Ant": [[98, "ant"]], "Half Cheetah": [[99, "half-cheetah"]], "Hopper": [[100, "hopper"]], "Humanoid": [[101, "humanoid"]], "Humanoid Standup": [[102, "humanoid-standup"]], "Inverted Double Pendulum": [[103, "inverted-double-pendulum"]], "Inverted Pendulum": [[104, "inverted-pendulum"]], "Pusher": [[105, "pusher"]], "Reacher": [[106, "reacher"]], "Swimmer": [[107, "swimmer"]], "Notes": [[107, "notes"]], "Walker2D": [[108, "walker2d"]], "Third-party Environments": [[109, "third-party-environments"]], "Video Game environments": [[109, "video-game-environments"]], "stable-retro: Classic retro games, a maintained version of OpenAI Retro": [[109, "stable-retro-classic-retro-games-a-maintained-version-of-openai-retro"]], "flappy-bird-gym: A Flappy Bird environment for Gym": [[109, "flappy-bird-gym-a-flappy-bird-environment-for-gym"]], "gym-derk: GPU accelerated MOBA environment": [[109, "gym-derk-gpu-accelerated-moba-environment"]], "SlimeVolleyGym: A simple environment for single and multi-agent reinforcement learning": [[109, "slimevolleygym-a-simple-environment-for-single-and-multi-agent-reinforcement-learning"]], "Unity ML Agents: Environments for Unity game engine": [[109, "unity-ml-agents-environments-for-unity-game-engine"]], "PGE: Parallel Game Engine": [[109, "pge-parallel-game-engine"]], "Robotics environments": [[109, "robotics-environments"]], "gym-jiminy: Training Robots in Jiminy": [[109, "gym-jiminy-training-robots-in-jiminy"]], "gym-pybullet-drones: Environments for quadcopter control": [[109, "gym-pybullet-drones-environments-for-quadcopter-control"]], "MarsExplorer: Environments for controlling robot on Mars": [[109, "marsexplorer-environments-for-controlling-robot-on-mars"]], "panda-gym: Robotics environments using the PyBullet physics engine": [[109, "panda-gym-robotics-environments-using-the-pybullet-physics-engine"]], "robo-gym: Real-world and simulation robotics": [[109, "robo-gym-real-world-and-simulation-robotics"]], "Offworld-gym": [[109, "offworld-gym"]], "safe-control-gym": [[109, "safe-control-gym"]], "gym-softrobot: Soft-robotics environments": [[109, "gym-softrobot-soft-robotics-environments"]], "iGibson": [[109, "igibson"]], "DexterousHands: dual dexterous hand manipulation tasks": [[109, "dexteroushands-dual-dexterous-hand-manipulation-tasks"]], "OmniIsaacGymEnvs": [[109, "omniisaacgymenvs"]], "Autonomous Driving environments": [[109, "autonomous-driving-environments"]], "sumo-rl": [[109, "sumo-rl"]], "gym-duckietown": [[109, "gym-duckietown"]], "gym-electric-motor": [[109, "gym-electric-motor"]], "highway-env": [[109, "highway-env"]], "CommonRoad-RL": [[109, "commonroad-rl"]], "tmrl: TrackMania 2020 through RL": [[109, "tmrl-trackmania-2020-through-rl"]], "racing_dreamer": [[109, "racing-dreamer"]], "l2r: Multimodal control environment where agents learn how to race": [[109, "l2r-multimodal-control-environment-where-agents-learn-how-to-race"]], "racecar_gym": [[109, "racecar-gym"]], "Other environments": [[109, "other-environments"]], "CompilerGym: Optimise compiler tasks": [[109, "compilergym-optimise-compiler-tasks"]], "CARL: context adaptive RL": [[109, "carl-context-adaptive-rl"]], "matrix-mdp: Easily create discrete MDPs": [[109, "matrix-mdp-easily-create-discrete-mdps"]], "mo-gym: Multi-objective Reinforcement Learning environments": [[109, "mo-gym-multi-objective-reinforcement-learning-environments"]], "gym-cellular-automata: Cellular Automata environments": [[109, "gym-cellular-automata-cellular-automata-environments"]], "gym-sokoban: 2D Transportation Puzzles": [[109, "gym-sokoban-2d-transportation-puzzles"]], "DACBench: Benchmark Library for Dynamic Algorithm configuration": [[109, "dacbench-benchmark-library-for-dynamic-algorithm-configuration"]], "NLPGym: A toolkit to develop RL agents to solve NLP tasks": [[109, "nlpgym-a-toolkit-to-develop-rl-agents-to-solve-nlp-tasks"]], "gym-saturation: Environments used to prove theorems": [[109, "gym-saturation-environments-used-to-prove-theorems"]], "ShinRL: Environments for evaluating RL algorithms": [[109, "shinrl-environments-for-evaluating-rl-algorithms"]], "gymnax: Hardware Accelerated RL Environments": [[109, "gymnax-hardware-accelerated-rl-environments"]], "gym-anytrading: Financial trading environments for FOREX and STOCKS": [[109, "gym-anytrading-financial-trading-environments-for-forex-and-stocks"]], "gym-mtsim: Financial trading for MetaTrader 5 platform": [[109, "gym-mtsim-financial-trading-for-metatrader-5-platform"]], "openmodelica-microgrid-gym: Environments for controlling power electronic converters in microgrids": [[109, "openmodelica-microgrid-gym-environments-for-controlling-power-electronic-converters-in-microgrids"]], "mobile-env: Environments for coordination of wireless mobile networks": [[109, "mobile-env-environments-for-coordination-of-wireless-mobile-networks"]], "GymFC: A flight control tuning and training framework": [[109, "gymfc-a-flight-control-tuning-and-training-framework"]], "Toy Text": [[110, "toy-text"]], "Blackjack": [[111, "blackjack"]], "Information": [[111, "information"], [112, "information"], [113, "information"], [114, "information"]], "Cliff Walking": [[112, "cliff-walking"]], "Frozen Lake": [[113, "frozen-lake"]], "Taxi": [[114, "taxi"]], "Gymnasium is a standard API for reinforcement learning, and a diverse collection of reference environments": [[115, "gymnasium-is-a-standard-api-for-reinforcement-learning-and-a-diverse-collection-of-reference-environments"]], "Solving Blackjack with Q-Learning": [[116, "solving-blackjack-with-q-learning"]], "Imports and Environment Setup": [[116, "imports-and-environment-setup"]], "Observing the environment": [[116, "observing-the-environment"]], "Executing an action": [[116, "executing-an-action"]], "Building an agent": [[116, "building-an-agent"], [119, "building-an-agent"]], "Visualizing the training": [[116, "visualizing-the-training"]], "Visualising the policy": [[116, "visualising-the-policy"]], "Think you can do better?": [[116, "think-you-can-do-better"]], "Make your own custom environment": [[117, "make-your-own-custom-environment"]], "Subclassing gymnasium.Env": [[117, "subclassing-gymnasium-env"]], "Declaration and Initialization": [[117, "declaration-and-initialization"]], "Constructing Observations From Environment States": [[117, "constructing-observations-from-environment-states"]], "Reset": [[117, "reset"]], "Step": [[117, "step"]], "Rendering": [[117, "rendering"]], "Close": [[117, "close"]], "Registering Envs": [[117, "registering-envs"]], "Creating a Package": [[117, "creating-a-package"]], "Creating Environment Instances": [[117, "creating-environment-instances"]], "Using Wrappers": [[117, "using-wrappers"]], "Handling Time Limits": [[118, "handling-time-limits"]], "Termination": [[118, "termination"]], "Truncation": [[118, "truncation"]], "Importance in learning code": [[118, "importance-in-learning-code"]], "Solution": [[118, "solution"]], "Training using REINFORCE for Mujoco": [[119, "training-using-reinforce-for-mujoco"]], "Policy Network": [[119, "policy-network"]], "Plot learning curve": [[119, "plot-learning-curve"]]}, "indexentries": {"env (class in gymnasium)": [[2, "gymnasium.Env"]], "action_space (gymnasium.env attribute)": [[2, "gymnasium.Env.action_space"]], "close() (in module gymnasium.env)": [[2, "gymnasium.Env.close"]], "metadata (gymnasium.env attribute)": [[2, "gymnasium.Env.metadata"]], "np_random (gymnasium.env property)": [[2, "gymnasium.Env.np_random"]], "observation_space (gymnasium.env attribute)": [[2, "gymnasium.Env.observation_space"]], "render() (in module gymnasium.env)": [[2, "gymnasium.Env.render"]], "render_mode (gymnasium.env attribute)": [[2, "gymnasium.Env.render_mode"]], "reset() (in module gymnasium.env)": [[2, "gymnasium.Env.reset"]], "reward_range (gymnasium.env attribute)": [[2, "gymnasium.Env.reward_range"]], "spec (gymnasium.env attribute)": [[2, "gymnasium.Env.spec"]], "step() (in module gymnasium.env)": [[2, "gymnasium.Env.step"]], "unwrapped (gymnasium.env property)": [[2, "gymnasium.Env.unwrapped"]], "funcenv (class in gymnasium.experimental)": [[4, "gymnasium.experimental.FuncEnv"]], "initial() (in module gymnasium.experimental.funcenv)": [[4, "gymnasium.experimental.FuncEnv.initial"], [4, "id0"]], "observation() (in module gymnasium.experimental.funcenv)": [[4, "gymnasium.experimental.FuncEnv.observation"], [4, "id1"]], "render_close() (in module gymnasium.experimental.funcenv)": [[4, "gymnasium.experimental.FuncEnv.render_close"]], "render_image() (in module gymnasium.experimental.funcenv)": [[4, "gymnasium.experimental.FuncEnv.render_image"]], "render_init() (in module gymnasium.experimental.funcenv)": [[4, "gymnasium.experimental.FuncEnv.render_init"]], "reward() (in module gymnasium.experimental.funcenv)": [[4, "gymnasium.experimental.FuncEnv.reward"]], "state_info() (in module gymnasium.experimental.funcenv)": [[4, "gymnasium.experimental.FuncEnv.state_info"]], "step_info() (in module gymnasium.experimental.funcenv)": [[4, "gymnasium.experimental.FuncEnv.step_info"]], "terminal() (in module gymnasium.experimental.funcenv)": [[4, "gymnasium.experimental.FuncEnv.terminal"]], "transform() (in module gymnasium.experimental.funcenv)": [[4, "gymnasium.experimental.FuncEnv.transform"]], "transition() (in module gymnasium.experimental.funcenv)": [[4, "gymnasium.experimental.FuncEnv.transition"]], "cliprewardv0 (class in gymnasium.experimental.wrappers)": [[7, "gymnasium.experimental.wrappers.ClipRewardV0"]], "lambdaactionv0 (class in gymnasium.experimental.wrappers)": [[7, "gymnasium.experimental.wrappers.LambdaActionV0"]], "lambdaobservationv0 (class in gymnasium.experimental.wrappers)": [[7, "gymnasium.experimental.wrappers.LambdaObservationV0"]], "lambdarewardv0 (class in gymnasium.experimental.wrappers)": [[7, "gymnasium.experimental.wrappers.LambdaRewardV0"]], "make() (in module gymnasium)": [[8, "gymnasium.make"]], "pprint_registry() (in module gymnasium)": [[8, "gymnasium.pprint_registry"]], "register() (in module gymnasium)": [[8, "gymnasium.register"]], "spec() (in module gymnasium)": [[8, "gymnasium.spec"]], "space (class in gymnasium.spaces)": [[9, "gymnasium.spaces.Space"]], "contains() (in module gymnasium.spaces.space.space)": [[9, "gymnasium.spaces.space.Space.contains"]], "dtype (space property)": [[9, "Space.dtype"]], "from_jsonable() (in module gymnasium.spaces.space.space)": [[9, "gymnasium.spaces.space.Space.from_jsonable"]], "sample() (in module gymnasium.spaces.space.space)": [[9, "gymnasium.spaces.space.Space.sample"]], "seed() (in module gymnasium.spaces.space.space)": [[9, "gymnasium.spaces.space.Space.seed"]], "shape (gymnasium.spaces.space.space property)": [[9, "gymnasium.spaces.space.Space.shape"]], "to_jsonable() (in module gymnasium.spaces.space.space)": [[9, "gymnasium.spaces.space.Space.to_jsonable"]], "dict (class in gymnasium.spaces)": [[10, "gymnasium.spaces.Dict"]], "graph (class in gymnasium.spaces)": [[10, "gymnasium.spaces.Graph"]], "sequence (class in gymnasium.spaces)": [[10, "gymnasium.spaces.Sequence"]], "tuple (class in gymnasium.spaces)": [[10, "gymnasium.spaces.Tuple"]], "sample() (gymnasium.spaces.dict method)": [[10, "gymnasium.spaces.Dict.sample"]], "sample() (gymnasium.spaces.graph method)": [[10, "gymnasium.spaces.Graph.sample"]], "sample() (gymnasium.spaces.sequence method)": [[10, "gymnasium.spaces.Sequence.sample"]], "sample() (gymnasium.spaces.tuple method)": [[10, "gymnasium.spaces.Tuple.sample"]], "seed() (gymnasium.spaces.dict method)": [[10, "gymnasium.spaces.Dict.seed"]], "seed() (gymnasium.spaces.graph method)": [[10, "gymnasium.spaces.Graph.seed"]], "seed() (gymnasium.spaces.sequence method)": [[10, "gymnasium.spaces.Sequence.seed"]], "seed() (gymnasium.spaces.tuple method)": [[10, "gymnasium.spaces.Tuple.seed"]], "box (class in gymnasium.spaces)": [[11, "gymnasium.spaces.Box"]], "discrete (class in gymnasium.spaces)": [[11, "gymnasium.spaces.Discrete"]], "multibinary (class in gymnasium.spaces)": [[11, "gymnasium.spaces.MultiBinary"]], "multidiscrete (class in gymnasium.spaces)": [[11, "gymnasium.spaces.MultiDiscrete"]], "text (class in gymnasium.spaces)": [[11, "gymnasium.spaces.Text"]], "is_bounded() (gymnasium.spaces.box method)": [[11, "gymnasium.spaces.Box.is_bounded"]], "sample() (gymnasium.spaces.box method)": [[11, "gymnasium.spaces.Box.sample"]], "sample() (gymnasium.spaces.discrete method)": [[11, "gymnasium.spaces.Discrete.sample"]], "sample() (gymnasium.spaces.multibinary method)": [[11, "gymnasium.spaces.MultiBinary.sample"]], "sample() (gymnasium.spaces.multidiscrete method)": [[11, "gymnasium.spaces.MultiDiscrete.sample"]], "sample() (gymnasium.spaces.text method)": [[11, "gymnasium.spaces.Text.sample"]], "seed() (gymnasium.spaces.box method)": [[11, "gymnasium.spaces.Box.seed"]], "seed() (gymnasium.spaces.discrete method)": [[11, "gymnasium.spaces.Discrete.seed"]], "seed() (gymnasium.spaces.multibinary method)": [[11, "gymnasium.spaces.MultiBinary.seed"]], "seed() (gymnasium.spaces.multidiscrete method)": [[11, "gymnasium.spaces.MultiDiscrete.seed"]], "seed() (gymnasium.spaces.text method)": [[11, "gymnasium.spaces.Text.seed"]], "flatdim() (in module gymnasium.spaces.utils)": [[12, "gymnasium.spaces.utils.flatdim"]], "flatten() (in module gymnasium.spaces.utils)": [[12, "gymnasium.spaces.utils.flatten"]], "flatten_space() (in module gymnasium.spaces.utils)": [[12, "gymnasium.spaces.utils.flatten_space"]], "unflatten() (in module gymnasium.spaces.utils)": [[12, "gymnasium.spaces.utils.unflatten"]], "batch_space() (in module gymnasium.vector.utils)": [[13, "gymnasium.vector.utils.batch_space"]], "concatenate() (in module gymnasium.vector.utils)": [[13, "gymnasium.vector.utils.concatenate"]], "create_empty_array() (in module gymnasium.vector.utils)": [[13, "gymnasium.vector.utils.create_empty_array"]], "create_shared_memory() (in module gymnasium.vector.utils)": [[13, "gymnasium.vector.utils.create_shared_memory"]], "iterate() (in module gymnasium.vector.utils)": [[13, "gymnasium.vector.utils.iterate"]], "read_from_shared_memory() (in module gymnasium.vector.utils)": [[13, "gymnasium.vector.utils.read_from_shared_memory"]], "write_to_shared_memory() (in module gymnasium.vector.utils)": [[13, "gymnasium.vector.utils.write_to_shared_memory"]], "playplot (class in gymnasium.utils.play)": [[14, "gymnasium.utils.play.PlayPlot"]], "playablegame (class in gymnasium.utils.play)": [[14, "gymnasium.utils.play.PlayableGame"]], "callback() (gymnasium.utils.play.playplot method)": [[14, "gymnasium.utils.play.PlayPlot.callback"]], "capped_cubic_video_schedule() (in module gymnasium.utils.save_video)": [[14, "gymnasium.utils.save_video.capped_cubic_video_schedule"]], "check_env() (in module gymnasium.utils.env_checker)": [[14, "gymnasium.utils.env_checker.check_env"]], "convert_to_done_step_api() (in module gymnasium.utils.step_api_compatibility)": [[14, "gymnasium.utils.step_api_compatibility.convert_to_done_step_api"]], "convert_to_terminated_truncated_step_api() (in module gymnasium.utils.step_api_compatibility)": [[14, "gymnasium.utils.step_api_compatibility.convert_to_terminated_truncated_step_api"]], "np_random() (in module gymnasium.utils.seeding)": [[14, "gymnasium.utils.seeding.np_random"]], "play() (in module gymnasium.utils.play)": [[14, "gymnasium.utils.play.play"]], "process_event() (gymnasium.utils.play.playablegame method)": [[14, "gymnasium.utils.play.PlayableGame.process_event"]], "save_video() (in module gymnasium.utils.save_video)": [[14, "gymnasium.utils.save_video.save_video"]], "step_api_compatibility() (in module gymnasium.utils.step_api_compatibility)": [[14, "gymnasium.utils.step_api_compatibility.step_api_compatibility"]], "asyncvectorenv (class in gymnasium.vector)": [[15, "gymnasium.vector.AsyncVectorEnv"]], "syncvectorenv (class in gymnasium.vector)": [[15, "gymnasium.vector.SyncVectorEnv"]], "vectorenv (class in gymnasium.vector)": [[15, "gymnasium.vector.VectorEnv"]], "action_space": [[15, "action_space"]], "close() (gymnasium.vector.vectorenv method)": [[15, "gymnasium.vector.VectorEnv.close"]], "make() (in module gymnasium.vector)": [[15, "gymnasium.vector.make"]], "observation_space": [[15, "observation_space"]], "reset() (gymnasium.vector.vectorenv method)": [[15, "gymnasium.vector.VectorEnv.reset"]], "single_action_space": [[15, "single_action_space"]], "single_observation_space": [[15, "single_observation_space"]], "step() (gymnasium.vector.vectorenv method)": [[15, "gymnasium.vector.VectorEnv.step"]], "wrapper (class in gymnasium)": [[16, "gymnasium.Wrapper"]], "action_space (gymnasium.wrapper property)": [[16, "gymnasium.Wrapper.action_space"]], "close() (in module gymnasium.wrapper)": [[16, "gymnasium.Wrapper.close"]], "metadata (gymnasium.wrapper property)": [[16, "gymnasium.Wrapper.metadata"]], "np_random (gymnasium.wrapper property)": [[16, "gymnasium.Wrapper.np_random"]], "observation_space (gymnasium.wrapper property)": [[16, "gymnasium.Wrapper.observation_space"]], "reset() (in module gymnasium.wrapper)": [[16, "gymnasium.Wrapper.reset"]], "reward_range (gymnasium.wrapper property)": [[16, "gymnasium.Wrapper.reward_range"]], "spec (gymnasium.wrapper property)": [[16, "gymnasium.Wrapper.spec"]], "step() (in module gymnasium.wrapper)": [[16, "gymnasium.Wrapper.step"]], "unwrapped (gymnasium.wrapper property)": [[16, "gymnasium.Wrapper.unwrapped"]], "actionwrapper (class in gymnasium)": [[17, "gymnasium.ActionWrapper"]], "actionwrapper.action() (in module gymnasium.actionwrapper)": [[17, "gymnasium.ActionWrapper.ActionWrapper.action"]], "clipaction (class in gymnasium.wrappers)": [[17, "gymnasium.wrappers.ClipAction"]], "rescaleaction (class in gymnasium.wrappers)": [[17, "gymnasium.wrappers.RescaleAction"]], "ataripreprocessing (class in gymnasium.wrappers)": [[18, "gymnasium.wrappers.AtariPreprocessing"]], "autoresetwrapper (class in gymnasium.wrappers)": [[18, "gymnasium.wrappers.AutoResetWrapper"]], "envcompatibility (class in gymnasium.wrappers)": [[18, "gymnasium.wrappers.EnvCompatibility"]], "humanrendering (class in gymnasium.wrappers)": [[18, "gymnasium.wrappers.HumanRendering"]], "orderenforcing (class in gymnasium.wrappers)": [[18, "gymnasium.wrappers.OrderEnforcing"]], "passiveenvchecker (class in gymnasium.wrappers)": [[18, "gymnasium.wrappers.PassiveEnvChecker"]], "recordepisodestatistics (class in gymnasium.wrappers)": [[18, "gymnasium.wrappers.RecordEpisodeStatistics"]], "recordvideo (class in gymnasium.wrappers)": [[18, "gymnasium.wrappers.RecordVideo"]], "rendercollection (class in gymnasium.wrappers)": [[18, "gymnasium.wrappers.RenderCollection"]], "stepapicompatibility (class in gymnasium.wrappers)": [[18, "gymnasium.wrappers.StepAPICompatibility"]], "timelimit (class in gymnasium.wrappers)": [[18, "gymnasium.wrappers.TimeLimit"]], "vectorlistinfo (class in gymnasium.wrappers)": [[18, "gymnasium.wrappers.VectorListInfo"]], "filterobservation (class in gymnasium.wrappers)": [[19, "gymnasium.wrappers.FilterObservation"]], "flattenobservation (class in gymnasium.wrappers)": [[19, "gymnasium.wrappers.FlattenObservation"]], "framestack (class in gymnasium.wrappers)": [[19, "gymnasium.wrappers.FrameStack"]], "grayscaleobservation (class in gymnasium.wrappers)": [[19, "gymnasium.wrappers.GrayScaleObservation"]], "normalizeobservation (class in gymnasium.wrappers)": [[19, "gymnasium.wrappers.NormalizeObservation"]], "observationwrapper (class in gymnasium)": [[19, "gymnasium.ObservationWrapper"]], "pixelobservationwrapper (class in gymnasium.wrappers)": [[19, "gymnasium.wrappers.PixelObservationWrapper"]], "resizeobservation (class in gymnasium.wrappers)": [[19, "gymnasium.wrappers.ResizeObservation"]], "timeawareobservation (class in gymnasium.wrappers)": [[19, "gymnasium.wrappers.TimeAwareObservation"]], "transformobservation (class in gymnasium.wrappers)": [[19, "gymnasium.wrappers.TransformObservation"]], "observation() (in module gymnasium.observationwrapper)": [[19, "gymnasium.ObservationWrapper.observation"]], "normalizereward (class in gymnasium.wrappers)": [[20, "gymnasium.wrappers.NormalizeReward"]], "rewardwrapper (class in gymnasium)": [[20, "gymnasium.RewardWrapper"]], "rewardwrapper.reward() (in module gymnasium.rewardwrapper)": [[20, "gymnasium.RewardWrapper.RewardWrapper.reward"]], "transformreward (class in gymnasium.wrappers)": [[20, "gymnasium.wrappers.TransformReward"]]}}) \ No newline at end of file