mirror of
https://github.com/Farama-Foundation/Gymnasium.git
synced 2025-08-19 13:32:03 +00:00
1 line
184 KiB
JavaScript
1 line
184 KiB
JavaScript
Search.setIndex({"docnames": ["404", "README", "api/env", "api/registry", "api/spaces", "api/spaces/composite", "api/spaces/fundamental", "api/spaces/utils", "api/spaces/vector_utils", "api/utils", "api/vector", "api/wrappers", "api/wrappers/action_wrappers", "api/wrappers/misc_wrappers", "api/wrappers/observation_wrappers", "api/wrappers/reward_wrappers", "content/basic_usage", "content/gym_compatibility", "content/migration-guide", "environments/atari", "environments/atari/adventure", "environments/atari/air_raid", "environments/atari/alien", "environments/atari/amidar", "environments/atari/assault", "environments/atari/asterix", "environments/atari/asteroids", "environments/atari/atlantis", "environments/atari/bank_heist", "environments/atari/battle_zone", "environments/atari/beam_rider", "environments/atari/berzerk", "environments/atari/bowling", "environments/atari/boxing", "environments/atari/breakout", "environments/atari/carnival", "environments/atari/centipede", "environments/atari/chopper_command", "environments/atari/complete_list", "environments/atari/crazy_climber", "environments/atari/defender", "environments/atari/demon_attack", "environments/atari/double_dunk", "environments/atari/elevator_action", "environments/atari/enduro", "environments/atari/fishing_derby", "environments/atari/freeway", "environments/atari/frostbite", "environments/atari/gopher", "environments/atari/gravitar", "environments/atari/hero", "environments/atari/ice_hockey", "environments/atari/jamesbond", "environments/atari/journey_escape", "environments/atari/kangaroo", "environments/atari/krull", "environments/atari/kung_fu_master", "environments/atari/montezuma_revenge", "environments/atari/ms_pacman", "environments/atari/name_this_game", "environments/atari/phoenix", "environments/atari/pitfall", "environments/atari/pong", "environments/atari/pooyan", "environments/atari/private_eye", "environments/atari/qbert", "environments/atari/riverraid", "environments/atari/road_runner", "environments/atari/robotank", "environments/atari/seaquest", "environments/atari/skiing", "environments/atari/solaris", "environments/atari/space_invaders", "environments/atari/star_gunner", "environments/atari/tennis", "environments/atari/time_pilot", "environments/atari/tutankham", "environments/atari/up_n_down", "environments/atari/venture", "environments/atari/video_pinball", "environments/atari/wizard_of_wor", "environments/atari/zaxxon", "environments/box2d", "environments/box2d/bipedal_walker", "environments/box2d/car_racing", "environments/box2d/lunar_lander", "environments/classic_control", "environments/classic_control/acrobot", "environments/classic_control/cart_pole", "environments/classic_control/mountain_car", "environments/classic_control/mountain_car_continuous", "environments/classic_control/pendulum", "environments/mujoco", "environments/mujoco/ant", "environments/mujoco/half_cheetah", "environments/mujoco/hopper", "environments/mujoco/humanoid", "environments/mujoco/humanoid_standup", "environments/mujoco/inverted_double_pendulum", "environments/mujoco/inverted_pendulum", "environments/mujoco/pusher", "environments/mujoco/reacher", "environments/mujoco/swimmer", "environments/mujoco/walker2d", "environments/third_party_environments", "environments/toy_text", "environments/toy_text/blackjack", "environments/toy_text/cliff_walking", "environments/toy_text/frozen_lake", "environments/toy_text/taxi", "index", "tutorials/blackjack_tutorial", "tutorials/environment_creation", "tutorials/handling_time_limits"], "filenames": ["404.md", "README.md", "api/env.md", "api/registry.md", "api/spaces.md", "api/spaces/composite.md", "api/spaces/fundamental.md", "api/spaces/utils.md", "api/spaces/vector_utils.md", "api/utils.md", "api/vector.md", "api/wrappers.md", "api/wrappers/action_wrappers.md", "api/wrappers/misc_wrappers.md", "api/wrappers/observation_wrappers.md", "api/wrappers/reward_wrappers.md", "content/basic_usage.md", "content/gym_compatibility.md", "content/migration-guide.md", "environments/atari.md", "environments/atari/adventure.md", "environments/atari/air_raid.md", "environments/atari/alien.md", "environments/atari/amidar.md", "environments/atari/assault.md", "environments/atari/asterix.md", "environments/atari/asteroids.md", "environments/atari/atlantis.md", "environments/atari/bank_heist.md", "environments/atari/battle_zone.md", "environments/atari/beam_rider.md", "environments/atari/berzerk.md", "environments/atari/bowling.md", "environments/atari/boxing.md", "environments/atari/breakout.md", "environments/atari/carnival.md", "environments/atari/centipede.md", "environments/atari/chopper_command.md", "environments/atari/complete_list.md", "environments/atari/crazy_climber.md", "environments/atari/defender.md", "environments/atari/demon_attack.md", "environments/atari/double_dunk.md", "environments/atari/elevator_action.md", "environments/atari/enduro.md", "environments/atari/fishing_derby.md", "environments/atari/freeway.md", "environments/atari/frostbite.md", "environments/atari/gopher.md", "environments/atari/gravitar.md", "environments/atari/hero.md", "environments/atari/ice_hockey.md", "environments/atari/jamesbond.md", "environments/atari/journey_escape.md", "environments/atari/kangaroo.md", "environments/atari/krull.md", "environments/atari/kung_fu_master.md", "environments/atari/montezuma_revenge.md", "environments/atari/ms_pacman.md", "environments/atari/name_this_game.md", "environments/atari/phoenix.md", "environments/atari/pitfall.md", "environments/atari/pong.md", "environments/atari/pooyan.md", "environments/atari/private_eye.md", "environments/atari/qbert.md", "environments/atari/riverraid.md", "environments/atari/road_runner.md", "environments/atari/robotank.md", "environments/atari/seaquest.md", "environments/atari/skiing.md", "environments/atari/solaris.md", "environments/atari/space_invaders.md", "environments/atari/star_gunner.md", "environments/atari/tennis.md", "environments/atari/time_pilot.md", "environments/atari/tutankham.md", "environments/atari/up_n_down.md", "environments/atari/venture.md", "environments/atari/video_pinball.md", "environments/atari/wizard_of_wor.md", "environments/atari/zaxxon.md", "environments/box2d.md", "environments/box2d/bipedal_walker.md", "environments/box2d/car_racing.md", "environments/box2d/lunar_lander.md", "environments/classic_control.md", "environments/classic_control/acrobot.md", "environments/classic_control/cart_pole.md", "environments/classic_control/mountain_car.md", "environments/classic_control/mountain_car_continuous.md", "environments/classic_control/pendulum.md", "environments/mujoco.md", "environments/mujoco/ant.md", "environments/mujoco/half_cheetah.md", "environments/mujoco/hopper.md", "environments/mujoco/humanoid.md", "environments/mujoco/humanoid_standup.md", "environments/mujoco/inverted_double_pendulum.md", "environments/mujoco/inverted_pendulum.md", "environments/mujoco/pusher.md", "environments/mujoco/reacher.md", "environments/mujoco/swimmer.md", "environments/mujoco/walker2d.md", "environments/third_party_environments.md", "environments/toy_text.md", "environments/toy_text/blackjack.md", "environments/toy_text/cliff_walking.md", "environments/toy_text/frozen_lake.md", "environments/toy_text/taxi.md", "index.md", "tutorials/blackjack_tutorial.rst", "tutorials/environment_creation.rst", "tutorials/handling_time_limits.rst"], "titles": ["404 - Page Not Found", "Gymnasium-docs", "Env", "Registry", "Spaces", "Composite Spaces", "Fundamental Spaces", "Spaces Utils", "Spaces Vector Utils", "Utils", "Vector", "Wrappers", "Action Wrappers", "Misc Wrappers", "Observation Wrappers", "Reward Wrappers", "Basic Usage", "Compatibility with Gym", "v21 to v26 Migration Guide", "Atari", "Adventure", "Air Raid", "Alien", "Amidar", "Assault", "Asterix", "Asteroids", "Atlantis", "Bank Heist", "Battle Zone", "Beam Rider", "Berzerk", "Bowling", "Boxing", "Breakout", "Carnival", "Centipede", "Chopper Command", "Complete List - Atari", "Crazy Climber", "Defender", "Demon Attack", "Double Dunk", "Elevator Action", "Enduro", "FishingDerby", "Freeway", "Frostbite", "Gopher", "Gravitar", "Hero", "IceHockey", "Jamesbond", "JourneyEscape", "Kangaroo", "Krull", "Kung Fu Master", "Montezuma Revenge", "Ms Pacman", "Name This Game", "Phoenix", "Pitfall", "Pong", "Pooyan", "PrivateEye", "Qbert", "Riverraid", "Road Runner", "Robot Tank", "Seaquest", "Skiings", "Solaris", "SpaceInvaders", "StarGunner", "Tennis", "TimePilot", "Tutankham", "Up n\u2019 Down", "Venture", "Video Pinball", "Wizard of Wor", "Zaxxon", "Box2D", "Bipedal Walker", "Car Racing", "Lunar Lander", "Classic Control", "Acrobot", "Cart Pole", "Mountain Car", "Mountain Car Continuous", "Pendulum", "MuJoCo", "Ant", "Half Cheetah", "Hopper", "Humanoid", "Humanoid Standup", "Inverted Double Pendulum", "Inverted Pendulum", "Pusher", "Reacher", "Swimmer", "Walker2D", "Third-Party Environments", "Toy Text", "Blackjack", "Cliff Walking", "Frozen Lake", "Taxi", "Gymnasium is a standard API for reinforcement learning, and a diverse collection of reference environments", "Solving Blackjack with Q-Learning", "Make your own custom environment", "Handling Time Limits"], "terms": {"thi": [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 106, 107, 108, 109, 110, 111, 112, 113], "folder": [1, 9, 13, 100, 101], "contain": [1, 2, 4, 7, 8, 10, 11, 13, 14, 16, 18, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 93, 94, 95, 96, 100, 101, 102, 103, 104, 106, 109, 111, 112], "If": [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 19, 25, 28, 33, 36, 45, 46, 47, 48, 49, 63, 70, 74, 83, 84, 85, 90, 93, 95, 96, 97, 101, 103, 106, 107, 108, 111, 112], "you": [1, 2, 4, 5, 6, 7, 9, 10, 11, 12, 13, 14, 15, 16, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 83, 84, 85, 93, 96, 97, 100, 101, 104, 110, 112, 113], "ar": [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 109, 111, 112, 113], "pleas": [1, 2, 9, 18, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 83, 84, 85, 87, 88, 89, 90, 91, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 106, 107, 108, 109], "pr": [1, 18, 104], "repo": [1, 19], "otherwis": [1, 2, 3, 5, 6, 9, 10, 13, 14, 19, 32, 104, 111], "follow": [1, 3, 4, 9, 11, 12, 13, 15, 16, 19, 32, 42, 44, 45, 46, 47, 48, 49, 74, 87, 88, 89, 90, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 106, 108, 111, 112, 113], "below": [1, 6, 11, 16, 45, 83, 85, 91, 100, 103, 111, 113], "directli": [1, 5, 11, 13, 16, 87, 104, 111, 112], "markdown": 1, "file": [1, 87, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 112], "repositori": [1, 11, 92, 104], "fork": [1, 18, 104, 110], "docstr": 1, "": [1, 2, 5, 6, 9, 10, 11, 12, 13, 14, 15, 16, 19, 39, 45, 46, 47, 48, 49, 51, 52, 55, 56, 57, 62, 63, 65, 82, 83, 84, 85, 86, 87, 89, 90, 91, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 105, 106, 108, 109, 110, 111, 112, 113], "python": [1, 3, 8, 13, 16, 83, 84, 85, 104, 105, 110, 111, 112, 113], "Then": [1, 11, 12, 16, 69, 102], "pip": [1, 19, 82, 86, 92, 112], "instal": [1, 9, 13, 27, 82, 86, 92, 112], "your": [1, 2, 10, 11, 12, 13, 14, 15, 16, 22, 23, 25, 27, 28, 30, 32, 33, 34, 36, 42, 44, 45, 46, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 62, 64, 65, 66, 67, 68, 69, 70, 71, 72, 75, 76, 77, 78, 79, 80, 81, 84, 93, 96, 97, 110, 111], "run": [1, 2, 3, 10, 13, 28, 50, 53, 61, 66, 67, 70, 71, 83, 85, 87, 93, 94, 95, 96, 97, 98, 99, 102, 103, 104, 112], "script": [1, 111], "gen_md": 1, "py": [1, 8, 19, 83, 84, 85, 92, 93, 96, 97, 107, 111, 112, 113], "automat": [1, 2, 3, 10, 11, 13, 17, 18, 112], "gener": [1, 2, 4, 5, 6, 9, 10, 11, 13, 14, 16, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 83, 84, 85, 87, 88, 89, 90, 91, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 106, 107, 108, 109, 110, 112], "For": [1, 2, 6, 7, 9, 11, 13, 14, 16, 17, 18, 19, 20, 22, 23, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 40, 50, 51, 52, 53, 54, 55, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 84, 85, 92, 108, 109, 111, 112], "add": [1, 3, 9, 10, 14, 16, 84, 92, 96, 97, 109, 111, 112], "complet": [1, 11, 13, 16, 18, 19, 39, 52, 64, 65, 84, 85, 111, 113], "ensur": [1, 2, 3, 5, 7, 9, 16, 111, 112], "i": [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 83, 84, 85, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 106, 107, 108, 109, 111, 112, 113], "ha": [1, 2, 4, 6, 7, 9, 11, 13, 14, 15, 16, 18, 19, 49, 69, 83, 84, 85, 86, 92, 93, 94, 95, 96, 97, 100, 101, 102, 103, 104, 106, 108, 110, 111, 112, 113], "properli": [1, 4], "format": [1, 4, 9, 11, 13, 14, 16], "md": [1, 112], "correspond": [1, 2, 3, 18, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 85, 87, 88, 89, 90, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 106, 109, 112], "gif": [1, 87], "_static": 1, "video": [1, 11, 38, 68, 83], "env_typ": 1, "where": [1, 3, 5, 6, 7, 9, 11, 13, 14, 16, 18, 19, 42, 84, 87, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 106, 108, 109, 110, 111, 112, 113], "categori": 1, "e": [1, 2, 4, 6, 7, 8, 10, 11, 13, 14, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 100, 101, 104, 106, 111, 112], "g": [1, 2, 4, 6, 7, 8, 10, 11, 70, 87, 91, 104, 108, 109, 111, 112], "mujoco": [1, 11, 16, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104], "snake_cas": 1, "name": [1, 3, 11, 38, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 112], "convent": [1, 2, 19], "altern": [1, 19], "gen_gif": 1, "index": [1, 8, 9, 13, 14, 16, 19, 88, 97, 107], "toctre": 1, "requir": [1, 2, 4, 14, 92, 111], "packag": [1, 13, 104], "r": [1, 6, 13, 15, 68, 87, 91, 109], "txt": 1, "To": [1, 3, 8, 10, 13, 14, 15, 16, 17, 18, 19, 27, 37, 65, 83, 84, 85, 87, 109, 111, 112], "onc": [1, 13, 26, 36, 43, 50, 98, 101, 109, 111, 112], "cd": [1, 112], "make": [1, 2, 5, 9, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 83, 84, 85, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 106, 107, 108, 109, 110, 111], "dirhtml": 1, "_build": 1, "rebuild": [1, 27], "everi": [1, 9, 13, 16, 36, 37, 41, 46, 68, 69, 78, 84, 85, 88, 93, 95, 96, 103, 104, 112], "time": [1, 2, 3, 5, 9, 10, 11, 19, 35, 38, 41, 42, 43, 47, 51, 53, 54, 61, 65, 66, 67, 68, 69, 70, 83, 84, 91, 93, 94, 95, 96, 97, 102, 103, 104, 107, 111, 112], "chang": [1, 2, 8, 9, 10, 11, 13, 14, 15, 16, 17, 18, 19, 47, 55, 65, 84, 87, 88, 89, 90, 91, 92, 100, 101, 104, 109, 111, 112], "made": [1, 100, 101], "sphinx": 1, "autobuild": 1, "b": [1, 6, 100, 101, 109], "we": [1, 2, 6, 13, 14, 15, 16, 18, 19, 93, 96, 97, 104, 111, 112, 113], "us": [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 107, 108, 109, 111, 113], "galleri": 1, "insid": [1, 5, 6, 13, 112], "directori": 1, "check": [1, 2, 6, 13, 104, 109, 111, 112], "demo": 1, "see": [1, 2, 4, 9, 10, 16, 18, 19, 20, 23, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 40, 50, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 85, 87, 93, 94, 95, 96, 102, 103, 104, 112], "exampl": [1, 2, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 84, 87, 104, 106, 107, 108, 111, 112, 113], "more": [1, 2, 4, 5, 6, 9, 10, 11, 14, 18, 19, 20, 23, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 40, 45, 50, 51, 52, 53, 54, 55, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 83, 85, 92, 93, 96, 97, 98, 99, 100, 101, 102, 111, 112, 113], "inform": [1, 2, 4, 5, 6, 9, 10, 11, 13, 14, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 83, 84, 85, 87, 88, 89, 90, 91, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 106, 107, 108, 109, 111, 112, 113], "convert": [1, 3, 4, 5, 11, 13, 14, 17, 18, 84, 104, 111], "jupyer": 1, "notebook": [1, 111, 112, 113], "can": [1, 2, 3, 4, 5, 6, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 106, 108, 109, 112], "want": [1, 2, 5, 10, 11, 12, 13, 15, 16, 28, 50, 111, 112], "execut": [1, 9, 12, 19, 42, 109, 112], "which": [1, 2, 3, 4, 5, 7, 8, 9, 10, 11, 13, 14, 15, 16, 17, 18, 19, 39, 41, 43, 57, 84, 85, 87, 88, 92, 93, 94, 95, 96, 97, 98, 100, 101, 102, 103, 104, 108, 109, 112, 113], "output": [1, 8, 9, 13, 16, 111], "plot": [1, 9, 111], "should": [1, 2, 4, 6, 9, 10, 13, 14, 16, 18, 100, 101, 111, 112], "start": [1, 2, 4, 6, 9, 10, 13, 29, 42, 43, 49, 53, 54, 69, 104, 106, 107, 108, 109, 111], "run_": 1, "note": [1, 4, 8, 13, 87, 88, 93, 96, 97, 109, 111, 113], "so": [1, 9, 10, 11, 13, 14, 16, 19, 47, 70, 85, 86, 93, 94, 95, 96, 97, 98, 99, 102, 103, 104, 111, 112, 113], "sure": [1, 2, 13, 112], "doesn": [1, 2, 3, 11, 13, 19, 85, 113], "t": [1, 2, 3, 5, 6, 7, 9, 11, 13, 14, 15, 18, 19, 35, 45, 46, 47, 48, 49, 68, 69, 84, 85, 89, 90, 111, 112, 113], "take": [1, 2, 3, 6, 7, 9, 10, 11, 12, 13, 16, 18, 19, 72, 86, 88, 90, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 108, 109, 111], "than": [1, 18, 45, 51, 69, 85, 87, 88, 89, 90, 94, 98, 99, 100, 102, 104, 106, 111], "few": [1, 87, 111], "second": [1, 5, 9, 10, 32, 63, 70, 85, 94, 98, 101, 102], "class": [2, 4, 5, 6, 9, 10, 11, 12, 13, 14, 15, 16, 92, 111, 112], "The": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 106, 107, 108, 109, 110, 111, 112, 113], "main": [2, 85, 95, 103], "reinforc": [2, 4, 16, 87, 102, 105, 106, 107, 109, 111, 113], "learn": [2, 4, 5, 13, 14, 15, 16, 19, 45, 46, 47, 48, 49, 83, 84, 85, 87, 88, 89, 90, 94, 97, 98, 99, 102, 105, 106, 107, 109, 112], "agent": [2, 4, 11, 13, 14, 16, 18, 19, 43, 52, 83, 84, 85, 89, 93, 94, 95, 96, 97, 98, 99, 102, 103, 107, 108, 109, 112, 113], "encapsul": 2, "an": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 85, 87, 88, 89, 90, 91, 93, 94, 95, 96, 97, 100, 101, 102, 103, 104, 106, 107, 109, 112, 113], "arbitrari": [2, 3, 6, 9, 14, 15, 104], "behind": [2, 63], "scene": [2, 63, 104], "dynam": [2, 19, 34, 45, 46, 47, 48, 49, 87, 91, 92, 98, 104], "through": [2, 3, 4, 10, 17, 18, 19, 34, 50, 53, 56, 57, 61, 70, 71, 96, 97, 104, 113], "step": [2, 3, 10, 11, 12, 13, 14, 15, 16, 19, 83, 85, 87, 88, 91, 107, 109, 110, 111, 112, 113], "reset": [2, 3, 9, 10, 11, 12, 13, 14, 15, 16, 87, 88, 89, 90, 91, 104, 109, 110, 111, 112], "function": [2, 3, 4, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 85, 91, 101, 104, 108, 109, 111, 113], "partial": 2, "fulli": [2, 104], "observ": [2, 4, 5, 8, 9, 10, 11, 12, 13, 15, 18, 104, 110, 112, 113], "singl": [2, 4, 5, 6, 7, 8, 9, 10, 14, 16, 95, 96, 97, 103, 112], "multi": [2, 6, 92, 96, 97, 100], "pettingzoo": 2, "api": [2, 11, 13, 16, 18, 104, 112, 113], "user": [2, 3, 10, 16, 18, 19, 87, 88, 89, 90, 91, 104, 112], "need": [2, 3, 4, 5, 9, 11, 12, 13, 14, 16, 18, 37, 39, 44, 50, 54, 64, 69, 83, 85, 88, 92, 111, 112, 113], "know": [2, 13, 16, 112], "updat": [2, 9, 13, 14, 16, 17, 18, 109, 111, 112, 113], "action": [2, 3, 4, 5, 6, 9, 10, 11, 13, 18, 38, 86, 104, 105, 110, 112], "return": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 83, 93, 94, 95, 96, 97, 98, 100, 101, 102, 103, 107, 109, 111, 112, 113], "next": [2, 8, 16, 18, 39, 41, 43], "reward": [2, 3, 9, 10, 11, 13, 16, 18, 92, 104, 110, 111, 112, 113], "termin": [2, 3, 9, 10, 11, 13, 15, 16, 17, 18, 87, 88, 89, 90, 93, 95, 96, 97, 98, 99, 100, 101, 103, 107, 110, 111, 112], "truncat": [2, 3, 9, 10, 11, 13, 15, 16, 17, 18, 87, 88, 89, 90, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 110, 111, 112], "due": [2, 18, 108, 113], "latest": 2, "from": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 18, 19, 21, 35, 42, 47, 48, 51, 53, 62, 63, 75, 81, 83, 84, 85, 87, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 107, 108, 109, 111, 112, 113], "about": [2, 9, 14, 16, 64, 87, 93, 96, 97, 111, 112, 113], "metric": [2, 9, 18], "debug": [2, 4, 9, 105], "info": [2, 9, 10, 11, 14, 15, 16, 18, 93, 94, 95, 96, 100, 101, 102, 103, 110, 111, 112, 113], "initi": [2, 3, 5, 6, 10, 11, 12, 13, 14, 15, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 83, 85, 86, 87, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 106, 107, 108, 109, 111], "state": [2, 11, 13, 14, 16, 18, 19, 86, 92, 104, 105, 107, 109, 111, 112, 113], "befor": [2, 3, 9, 10, 11, 12, 13, 14, 15, 27, 39, 53, 64, 71, 72, 84, 93, 94, 95, 96, 97, 98, 99, 101, 102, 103, 112], "call": [2, 3, 7, 9, 10, 11, 12, 13, 14, 16, 17, 18, 19, 32, 51, 100, 101, 106, 108, 111, 112], "first": [2, 9, 10, 11, 13, 14, 16, 18, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 83, 84, 85, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 106, 107, 108, 109, 111, 112], "episod": [2, 3, 9, 11, 14, 18, 107, 109, 111, 112, 113], "render": [2, 10, 11, 14, 16, 19, 82, 83, 93, 94, 95, 96, 97, 98, 99, 102, 103, 104, 111, 112], "help": [2, 4, 16, 22, 54, 57, 100, 104, 111], "visualis": [2, 16], "what": [2, 4, 13, 19, 109], "mode": [2, 10, 11, 13, 16, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 111, 112], "human": [2, 5, 11, 16, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 84, 96, 97, 100, 104, 110, 112], "rgb_arrai": [2, 9, 11, 13, 14, 19, 112], "ansi": [2, 112], "text": [2, 4, 5, 7, 16, 106, 107, 108, 109], "close": [2, 6, 9, 10, 11, 16, 18, 39, 64, 93, 95, 96, 101, 103, 110, 111, 112], "import": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 83, 84, 85, 87, 88, 89, 90, 91, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 106, 107, 108, 109, 110, 112], "when": [2, 4, 5, 7, 8, 9, 10, 11, 13, 14, 15, 17, 19, 22, 35, 39, 40, 41, 43, 45, 46, 47, 48, 49, 51, 52, 66, 67, 68, 69, 72, 84, 85, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 107, 109, 112, 113], "extern": [2, 18, 93, 96, 97, 113], "softwar": [2, 104], "pygam": [2, 9, 18, 82, 104, 112], "databas": 2, "have": [2, 3, 6, 7, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 22, 25, 27, 28, 32, 34, 36, 37, 39, 40, 45, 46, 47, 48, 49, 50, 53, 54, 55, 59, 61, 63, 69, 71, 82, 83, 84, 87, 93, 94, 95, 96, 97, 99, 100, 102, 103, 104, 106, 109, 111, 112, 113], "understand": [2, 7, 10, 100, 104], "action_spac": [2, 9, 10, 11, 12, 14, 15, 16, 18, 109, 110, 111, 112], "space": [2, 9, 10, 11, 12, 13, 14, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 92, 104, 105, 107, 109, 112], "object": [2, 4, 8, 11, 16, 20, 25, 39, 45, 46, 54, 66, 72, 100, 104, 111], "valid": [2, 3, 4, 6, 8, 10, 11, 12, 13, 16, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 111], "all": [2, 5, 6, 10, 11, 13, 16, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 46, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 84, 85, 86, 87, 88, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 107, 111], "within": [2, 4, 12, 14, 16, 18, 57, 61, 85, 86, 98, 99, 104], "observation_spac": [2, 5, 6, 10, 11, 14, 16, 112], "reward_rang": [2, 11, 15], "A": [2, 4, 5, 6, 7, 9, 10, 12, 13, 14, 15, 17, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 83, 84, 87, 88, 90, 93, 94, 95, 96, 97, 98, 100, 101, 102, 103, 108, 111, 112, 113], "tupl": [2, 4, 6, 7, 8, 9, 11, 14, 16, 18, 19, 93, 95, 96, 103, 106, 109, 111, 112], "minimum": [2, 6, 91], "maximum": [2, 3, 6, 9, 13, 16, 68, 69, 85, 87, 91, 98, 104, 112], "possibl": [2, 5, 6, 7, 16, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 85, 87, 88, 89, 90, 94, 96, 98, 99, 102, 103, 104, 107, 108, 109, 111, 112], "over": [2, 8, 13, 15, 22, 28, 51, 61, 66, 94, 96, 106, 108, 111], "default": [2, 3, 4, 5, 6, 9, 10, 11, 13, 14, 16, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 84, 87, 91, 93, 94, 95, 96, 100, 101, 102, 103, 104, 112, 113], "rang": [2, 8, 9, 11, 12, 13, 15, 16, 17, 18, 19, 51, 83, 86, 87, 88, 89, 90, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 110, 111, 112], "set": [2, 5, 6, 10, 11, 12, 13, 14, 18, 19, 20, 21, 22, 23, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 77, 78, 79, 80, 82, 85, 86, 87, 89, 90, 92, 93, 94, 95, 96, 100, 101, 102, 103, 104, 111, 112, 113], "infti": [2, 6], "spec": [2, 10, 11, 13], "metadata": [2, 9, 11, 13, 19, 112], "fp": [2, 9, 19, 112], "np_random": [2, 9, 11, 13, 18, 112], "random": [2, 4, 5, 6, 9, 13, 14, 16, 19, 84, 85, 87, 88, 89, 90, 91, 93, 94, 95, 96, 101, 102, 103, 104, 108, 109, 111, 112], "number": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 13, 14, 16, 17, 19, 21, 22, 23, 24, 25, 26, 27, 30, 31, 32, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 53, 56, 58, 59, 60, 62, 63, 65, 68, 70, 72, 73, 75, 76, 77, 79, 80, 84, 85, 87, 95, 96, 97, 102, 103, 106, 108, 112], "assign": [2, 70, 88, 89, 90, 100, 101], "dure": [2, 5, 6, 10, 11, 13, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 87, 93, 94, 95, 96, 102, 103, 109, 112], "super": [2, 11, 12, 14, 15, 18, 112], "seed": [2, 3, 4, 5, 6, 10, 16, 67, 110, 112], "assess": 2, "self": [2, 4, 5, 11, 12, 13, 14, 15, 90, 104, 111, 112], "modifi": [2, 4, 10, 11, 12, 14, 15, 18, 87, 100, 101, 109, 112], "extend": 2, "wrapper": [2, 3, 5, 6, 9, 10, 16, 17, 18, 100, 101, 104, 110, 111], "acttyp": [2, 9, 11], "obstyp": [2, 9, 11, 18], "float": [2, 3, 7, 9, 11, 12, 14, 15, 19, 50, 63, 85, 93, 94, 95, 96, 102, 103, 104, 111, 112], "bool": [2, 3, 4, 6, 9, 10, 11, 13, 14, 18, 19, 85, 93, 94, 95, 96, 102, 103, 111, 112], "dict": [2, 4, 6, 7, 8, 9, 10, 11, 13, 14, 16, 18, 112], "one": [2, 5, 6, 7, 9, 10, 11, 13, 14, 16, 17, 18, 21, 22, 23, 27, 32, 39, 42, 43, 55, 64, 65, 66, 68, 69, 74, 87, 88, 89, 90, 91, 93, 95, 97, 98, 99, 101, 102, 104, 106, 109, 111, 113], "timestep": [2, 13, 14, 16, 89, 90, 93, 95, 96, 97, 98, 99, 100, 101, 103, 112], "end": [2, 11, 13, 16, 27, 36, 37, 39, 41, 43, 44, 52, 53, 54, 64, 68, 71, 72, 83, 91, 104, 107, 109, 111, 113], "reach": [2, 11, 27, 29, 39, 42, 43, 60, 63, 71, 72, 86, 87, 88, 89, 90, 93, 95, 96, 97, 98, 99, 100, 101, 103, 104, 107, 108, 109, 111, 112, 113], "necessari": [2, 4, 19, 45, 46, 47, 48, 49], "version": [2, 3, 4, 11, 88, 111, 112, 113], "0": [2, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 83, 84, 85, 87, 88, 89, 90, 91, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 106, 107, 108, 109, 111, 112, 113], "26": [2, 17, 93, 96, 97, 112, 113], "wa": [2, 9, 10, 11, 14, 15, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 93, 94, 95, 96, 102, 103, 113], "remov": [2, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 87, 109], "done": [2, 3, 9, 11, 13, 16, 17, 18, 93, 95, 96, 97, 98, 99, 103, 111, 112, 113], "favor": 2, "clearer": 2, "had": 2, "critic": [2, 13], "bootstrap": [2, 18, 113], "algorithm": [2, 4, 92, 104, 105, 109, 111, 113], "paramet": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 18, 85, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 102, 103, 112], "provid": [2, 4, 5, 6, 9, 10, 11, 12, 13, 14, 16, 17, 19, 25, 39, 41, 45, 46, 47, 48, 49, 83, 87, 104, 112], "element": [2, 4, 5, 6, 8, 10, 14, 16, 88, 89, 90, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 108, 112], "numpi": [2, 4, 6, 8, 10, 11, 12, 14, 18, 104, 107, 111, 112], "arrai": [2, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 85, 104, 111, 112], "posit": [2, 5, 6, 7, 8, 9, 13, 14, 16, 19, 30, 51, 83, 84, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 107, 108, 109, 111, 112], "veloc": [2, 5, 7, 8, 83, 85, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103], "pole": [2, 70, 86, 98, 99, 104], "cartpol": [2, 3, 9, 10, 13, 14, 15, 16, 86, 88, 98, 99, 104], "result": [2, 7, 9, 10, 16, 87, 93, 96, 97, 105, 107, 109, 111], "whether": [2, 3, 6, 9, 13, 18, 32, 85, 93, 94, 95, 96, 102, 103, 106, 111, 112, 113], "defin": [2, 4, 7, 11, 12, 13, 14, 15, 16, 91, 96, 112, 113], "under": [2, 14, 15, 104, 111], "mdp": [2, 13, 16, 89, 90], "task": [2, 5, 11, 14, 16, 55, 61, 64, 84, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 107, 112, 113], "neg": [2, 6, 9, 16, 70, 90, 93, 94, 96, 97, 98, 100, 101], "goal": [2, 22, 25, 30, 32, 34, 36, 39, 51, 56, 57, 58, 59, 60, 62, 65, 67, 69, 70, 76, 77, 78, 79, 80, 81, 87, 88, 89, 90, 91, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 106, 107, 108, 109, 112], "move": [2, 11, 15, 16, 18, 21, 24, 25, 34, 35, 49, 52, 63, 66, 69, 70, 83, 85, 88, 93, 94, 95, 97, 98, 99, 100, 101, 102, 103, 104, 107, 108, 109, 112, 113], "lava": [2, 16, 50], "sutton": [2, 87, 88, 98, 99, 106, 107, 111], "barton": 2, "gridworld": [2, 107, 112], "true": [2, 3, 7, 9, 10, 12, 13, 14, 16, 17, 19, 45, 46, 47, 48, 49, 83, 84, 85, 93, 94, 95, 96, 102, 103, 106, 108, 111, 112], "condit": [2, 111, 113], "outsid": [2, 84, 85, 113], "scope": [2, 113], "satisfi": 2, "typic": [2, 9, 104, 109], "timelimit": [2, 3, 11, 13, 16, 112, 113], "could": [2, 9, 14, 15, 16, 19, 111, 112, 113], "also": [2, 3, 6, 9, 10, 11, 13, 14, 16, 19, 31, 52, 53, 64, 65, 67, 83, 84, 85, 86, 92, 93, 94, 95, 96, 102, 103, 104, 111, 112, 113], "indic": [2, 9, 13, 18, 84, 87, 88, 93, 96, 97, 109, 111, 113], "physic": [2, 82, 92, 98, 99, 104], "go": [2, 43, 70, 74, 84, 106, 111, 113], "out": [2, 8, 19, 28, 33, 50, 53, 61, 66, 71, 104, 112, 113], "bound": [2, 6, 11, 12, 16, 18, 85, 87, 88, 89, 90, 91, 113], "prematur": 2, "auxiliari": [2, 112], "diagnost": 2, "log": 2, "might": [2, 4, 6, 7, 11, 12, 13, 14, 15, 18, 104, 111, 112], "instanc": [2, 3, 4, 5, 7, 8, 9, 10, 11, 13, 15, 16, 104], "describ": [2, 5, 16, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 87, 88, 102, 104, 106], "perform": [2, 9, 13, 16, 17, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 101, 104], "variabl": [2, 4, 6, 10, 13, 95, 102, 103, 104, 111, 112, 113], "hidden": [2, 92, 104], "individu": [2, 11, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 112], "term": [2, 11, 86, 87, 92, 93, 94, 95, 96, 100, 101, 102, 103, 112], "combin": [2, 4, 9, 11, 16, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 50, 51, 52, 53, 54, 55, 56, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 101], "produc": [2, 11, 13, 97, 112], "total": [2, 39, 83, 84, 85, 93, 94, 95, 96, 97, 98, 100, 101, 102, 103, 109], "In": [2, 6, 9, 10, 11, 12, 14, 16, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 84, 86, 87, 93, 94, 95, 96, 102, 103, 104, 107, 109, 111, 112, 113], "openai": [2, 3, 10, 11, 16, 18, 82, 104, 110, 111, 113], "gym": [2, 3, 4, 5, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 18, 82, 83, 84, 85, 87, 88, 89, 90, 91, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 106, 107, 108, 109, 110, 111, 112, 113], "v26": 2, "distinguish": [2, 112, 113], "howev": [2, 3, 4, 5, 6, 7, 10, 11, 12, 13, 14, 16, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 87, 93, 94, 95, 96, 100, 101, 109, 111, 112, 113], "deprec": 2, "favour": [2, 17, 18], "boolean": [2, 4, 9, 13, 18, 85, 111], "valu": [2, 3, 4, 5, 6, 7, 8, 9, 11, 12, 13, 14, 16, 18, 19, 69, 83, 85, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 106, 108, 109, 111, 113], "case": [2, 4, 5, 6, 11, 12, 14, 16, 18, 52, 64, 84, 93, 94, 95, 96, 102, 103, 109, 112, 113], "further": [2, 18, 69, 85, 100, 101], "undefin": 2, "signal": [2, 11, 13, 16, 93, 95, 96, 103, 109, 112, 113], "mai": [2, 6, 9, 10, 12, 13, 14, 16, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 93, 94, 95, 96, 102, 103, 108, 112], "emit": [2, 11, 13], "differ": [2, 4, 5, 9, 10, 11, 12, 13, 14, 16, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 84, 91, 93, 94, 95, 96, 97, 98, 99, 103, 104, 112, 113], "reason": [2, 18, 85, 104], "mayb": 2, "underli": [2, 11, 13, 16, 87], "solv": [2, 83, 86, 88, 92, 98, 99, 112], "successfulli": 2, "certain": [2, 42, 44, 98, 99, 101, 111], "exceed": [2, 11, 13, 16, 93, 95, 96, 103, 111], "simul": [2, 19, 45, 46, 47, 48, 49, 92, 96, 97, 98, 99, 104, 111], "enter": [2, 9, 26, 28, 55, 85], "invalid": [2, 6, 111], "option": [2, 3, 4, 5, 6, 9, 10, 11, 13, 14, 16, 18, 84, 87, 88, 89, 90, 91, 112], "int": [2, 3, 4, 5, 6, 7, 8, 9, 10, 12, 13, 14, 19, 111, 112], "none": [2, 3, 4, 5, 6, 7, 8, 9, 10, 13, 14, 18, 108, 111, 112], "intern": [2, 10, 14], "new": [2, 4, 11, 12, 13, 14, 16, 17, 18, 23, 26, 28, 41, 87, 88, 89, 90, 91, 101, 104, 111, 112, 113], "often": [2, 4, 92, 112], "some": [2, 4, 5, 6, 10, 11, 13, 14, 15, 16, 18, 19, 35, 43, 61, 84, 86, 87, 92, 101, 102, 104, 109, 111, 112], "explor": [2, 4, 49, 104, 111], "generalis": 2, "polici": [2, 14, 15, 16, 18, 86, 92, 93, 94, 95, 96, 97, 102, 103, 104, 110, 113], "control": [2, 4, 6, 15, 16, 18, 19, 21, 24, 26, 27, 28, 29, 30, 35, 37, 40, 47, 48, 49, 52, 54, 61, 62, 64, 66, 67, 68, 69, 70, 71, 74, 75, 82, 84, 87, 88, 89, 90, 91, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103], "alreadi": [2, 11, 14, 16], "rng": [2, 4, 5, 6, 112], "therefor": [2, 4, 10, 18], "right": [2, 6, 19, 21, 23, 24, 25, 26, 30, 34, 35, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 51, 52, 53, 54, 56, 58, 59, 60, 62, 65, 70, 72, 73, 75, 76, 79, 80, 83, 84, 85, 88, 89, 90, 91, 93, 94, 95, 96, 97, 98, 99, 102, 103, 107, 108, 109, 111, 112], "after": [2, 3, 9, 10, 13, 14, 16, 27, 31, 36, 42, 46, 50, 72, 85, 93, 94, 95, 96, 97, 102, 103, 104, 106, 109, 111, 112, 113], "never": 2, "again": [2, 85, 112], "custom": [2, 4, 9, 10, 14, 16, 18, 19, 45, 46, 47, 48, 49, 102, 104, 108], "line": [2, 18, 42, 87, 112], "correctli": [2, 14, 15, 112], "v0": [2, 3, 10, 11, 13, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 83, 84, 85, 87, 88, 89, 90, 91, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 106, 107, 108, 109, 112, 113], "25": [2, 19, 45, 46, 47, 48, 49, 93, 95, 96, 97, 103, 109], "return_info": 2, "now": [2, 18, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 83, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 111, 112, 113], "expect": [2, 4, 5, 6, 10, 13, 16], "prng": [2, 4, 5, 6], "doe": [2, 3, 5, 7, 9, 10, 11, 13, 17, 31, 47, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 106, 112, 113], "pass": [2, 3, 4, 5, 6, 7, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 84, 85, 93, 94, 95, 96, 102, 103, 112], "chosen": [2, 6, 19], "sourc": [2, 92, 104, 111, 112, 113], "entropi": 2, "timestamp": 2, "dev": 2, "urandom": 2, "integ": [2, 5, 6, 9, 13, 14, 18, 19, 109, 112], "even": [2, 3, 20, 22, 28, 29, 31, 33, 36, 37, 40, 50, 51, 52, 54, 55, 57, 61, 64, 66, 67, 68, 69, 71, 74, 78, 81, 97, 111, 112], "exist": [2, 3, 4, 10, 11, 16], "usual": [2, 5, 6, 11, 13, 19, 45, 46, 47, 48, 49, 51, 95, 111, 112], "been": [2, 9, 13, 16, 18, 93, 96, 97, 104, 112, 113], "refer": [2, 9, 13, 16, 18, 112, 113], "minim": [2, 112, 113], "abov": [2, 5, 6, 9, 17, 18, 19, 45, 46, 47, 48, 49, 87, 88, 91, 92], "paradigm": 2, "specifi": [2, 4, 5, 6, 9, 11, 12, 13, 14, 15, 16, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 85, 86, 91, 95, 96, 100, 101, 103, 104, 105, 108, 109, 112], "how": [2, 4, 9, 10, 16, 51, 53, 54, 97, 98, 100, 101, 111, 112, 113], "depend": [2, 5, 9, 14, 15, 19, 21, 22, 23, 24, 25, 26, 27, 30, 31, 32, 34, 35, 37, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 53, 54, 56, 58, 59, 60, 62, 63, 65, 70, 72, 73, 75, 76, 77, 79, 80, 82, 86, 88, 92, 93, 94, 95, 96, 102, 103, 104, 108], "specif": [2, 3, 6, 13, 113], "analog": [2, 19], "dictionari": [2, 4, 5, 9, 10, 11, 13, 14, 16, 109, 111, 112], "complement": 2, "It": [2, 3, 5, 6, 9, 10, 11, 13, 16, 19, 20, 21, 22, 23, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 50, 51, 52, 53, 54, 55, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 77, 78, 79, 80, 83, 92, 93, 94, 95, 96, 97, 100, 101, 102, 103, 104, 107, 111, 112], "union": [2, 3, 4, 5, 6, 7, 8, 9, 10, 12, 14], "renderfram": [2, 9], "list": [2, 4, 5, 6, 9, 10, 11, 14, 16, 19, 104, 111], "comput": [2, 9, 62, 74, 93, 98, 100, 101, 104, 111, 112], "frame": [2, 9, 13, 14, 19, 32, 84, 85, 97, 100], "render_mod": [2, 9, 10, 11, 13, 14, 16, 18, 19, 110, 112], "wai": [2, 5, 11, 16, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 104, 111, 113], "most": [2, 4, 11, 13, 14, 16, 18, 19, 45, 46, 47, 48, 49, 101, 104, 111, 112], "achiev": [2, 19, 22, 87, 106], "appli": [2, 3, 5, 7, 8, 9, 10, 11, 12, 13, 14, 15, 83, 85, 86, 87, 88, 89, 90, 91, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 106, 111, 112], "collect": [2, 10, 22, 25, 43, 57, 58, 61, 77, 104, 111], "As": [2, 10, 11, 16, 75, 87, 92, 93, 94, 96, 97, 105, 109], "known": [2, 13, 26], "__init__": [2, 5, 8, 11, 12, 14, 15, 111, 112], "initialis": [2, 13, 18], "By": [2, 3, 13, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 87, 93, 94, 95, 96, 102, 103], "continu": [2, 4, 11, 12, 16, 24, 25, 84, 85, 86, 89, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 111, 113], "current": [2, 6, 9, 11, 13, 14, 19, 84, 87, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 106, 107, 108, 109, 111, 112], "displai": [2, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 88, 104, 112], "consumpt": 2, "occur": [2, 13, 87, 88, 112], "repres": [2, 5, 6, 9, 16, 18, 85, 87, 90, 91, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 108, 109, 110, 112], "np": [2, 4, 5, 6, 8, 9, 10, 12, 13, 14, 15, 85, 109, 111, 112], "ndarrai": [2, 3, 5, 6, 7, 8, 9, 12, 87, 88, 89, 90, 91, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 109], "shape": [2, 4, 5, 6, 7, 8, 11, 12, 13, 14, 16, 83, 84, 85, 87, 88, 89, 90, 91, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 112], "x": [2, 4, 6, 7, 85, 88, 89, 90, 91, 93, 94, 95, 96, 97, 98, 100, 101, 102, 103, 104, 112], "y": [2, 6, 19, 85, 91, 93, 94, 96, 97, 98, 100, 101, 102, 109], "3": [2, 5, 6, 7, 8, 9, 10, 13, 14, 17, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 83, 84, 85, 87, 88, 89, 90, 91, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 106, 107, 108, 109, 111, 112], "rgb": [2, 11, 13, 14, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 84, 93, 94, 95, 96, 97, 98, 99, 102, 103], "pixel": [2, 11, 84, 104, 112], "imag": [2, 4, 10, 11, 13, 14, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 84, 104], "string": [2, 4, 6, 9, 14], "str": [2, 3, 4, 5, 6, 7, 9, 10, 13, 14, 18, 19, 93, 94, 95, 96, 102, 103, 111], "stringio": [2, 105], "style": [2, 10, 13, 104], "represent": [2, 16, 113], "each": [2, 3, 4, 5, 6, 9, 10, 11, 12, 14, 16, 19, 39, 41, 42, 43, 44, 47, 55, 62, 64, 65, 66, 67, 68, 69, 70, 82, 83, 85, 86, 87, 88, 89, 90, 93, 96, 97, 98, 99, 100, 104, 105, 107, 109, 111, 112], "includ": [2, 3, 14, 16, 17, 18, 19, 88, 93, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 109, 112, 113], "newlin": 2, "escap": [2, 38, 53, 57], "sequenc": [2, 3, 4, 6, 7, 10, 14, 16, 19, 104], "color": [2, 5, 23, 34, 47, 65], "rgb_array_list": [2, 9, 11, 13], "ansi_list": 2, "base": [2, 4, 5, 10, 11, 12, 13, 14, 15, 16, 43, 52, 69, 82, 87, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 109, 111, 112], "except": [2, 66, 69, 112], "rendercollect": [2, 11, 13], "pop": [2, 101], "kei": [2, 3, 4, 5, 6, 9, 10, 11, 13, 14, 16, 19, 20, 51, 93, 94, 95, 96, 100, 101, 102, 103, 104, 109, 111, 112, 113], "support": [2, 4, 5, 7, 9, 10, 11, 13, 14, 16, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 87, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 112], "longer": [2, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 93, 95, 96, 97, 98, 99, 100, 101, 103, 104], "accept": [2, 9, 13, 19, 112], "rather": [2, 18, 84, 104, 111], "v1": [2, 3, 9, 10, 13, 14, 15, 16, 83, 84, 85, 87, 88, 91, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 106, 108, 109, 111], "type": [2, 4, 5, 6, 10, 11, 12, 14, 16, 18, 41, 84, 93, 94, 95, 96, 102, 103, 104, 112], "discret": [2, 4, 5, 7, 8, 10, 12, 14, 16, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 84, 85, 87, 88, 89, 90, 104, 105, 106, 107, 108, 109, 111, 112], "give": [2, 22, 23, 41, 42, 85, 100, 106, 109, 111], "2": [2, 5, 6, 7, 8, 9, 10, 12, 14, 15, 19, 20, 21, 23, 24, 25, 26, 27, 29, 30, 32, 34, 35, 37, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 51, 53, 56, 58, 59, 60, 62, 63, 65, 70, 72, 73, 74, 75, 76, 77, 79, 80, 85, 87, 88, 89, 90, 91, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 106, 107, 108, 109, 111, 112], "mean": [2, 16, 18, 87, 93, 94, 95, 100, 112], "two": [2, 5, 6, 9, 10, 13, 18, 19, 21, 32, 74, 83, 85, 87, 89, 90, 92, 93, 94, 95, 96, 97, 98, 100, 101, 102, 103, 106, 111, 112], "1": [2, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 83, 84, 85, 87, 88, 89, 90, 91, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 106, 107, 108, 109, 111, 112, 113], "box": [2, 4, 5, 7, 8, 10, 11, 12, 14, 16, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 83, 84, 85, 90, 91, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 112], "4028234663852886e": 2, "38": [2, 96, 97], "4": [2, 6, 7, 9, 10, 11, 12, 13, 14, 16, 19, 21, 23, 24, 25, 26, 28, 30, 32, 34, 35, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 53, 56, 58, 59, 60, 62, 63, 64, 65, 72, 73, 75, 76, 77, 79, 80, 83, 85, 87, 88, 89, 90, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 107, 108, 109, 111, 112], "float32": [2, 5, 6, 7, 8, 10, 11, 12, 14, 16, 83, 84, 85, 90, 91, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103], "denot": [2, 88], "well": [2, 4, 26, 69, 87, 93, 96, 97, 104, 112], "high": [2, 5, 6, 7, 8, 10, 14, 16, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 83, 84, 85, 87, 88, 89, 90, 91, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104], "8000002e": 2, "00": 2, "4028235e": 2, "1887903e": 2, "01": [2, 15, 85, 93, 94, 97, 98, 99, 100, 101, 102, 111], "dtype": [2, 4, 5, 6, 8, 10, 14, 85, 112], "low": [2, 5, 6, 7, 8, 14, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 83, 84, 85, 87, 88, 89, 90, 91, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104], "ani": [2, 4, 5, 8, 9, 13, 14, 18, 19, 41, 45, 46, 47, 48, 49, 50, 68, 85, 88, 93, 95, 96, 97, 98, 99, 100, 101, 102, 103, 108, 111, 112, 113], "etc": [2, 4, 11, 64, 67, 71, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 112, 113], "determin": [2, 6, 19, 85, 87, 88, 89, 90, 91, 104, 112, 113], "inf": [2, 14, 88, 89, 90, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103], "envspec": [2, 3], "normal": [2, 6, 11, 13, 83, 84, 91, 93, 94, 98], "finish": [2, 84, 85], "code": [2, 4, 5, 9, 10, 11, 13, 14, 15, 87, 104, 111, 112], "clean": 2, "up": [2, 5, 6, 10, 14, 19, 20, 22, 23, 24, 25, 26, 28, 29, 30, 32, 35, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 52, 53, 56, 58, 63, 65, 66, 67, 69, 70, 73, 74, 75, 76, 79, 80, 83, 85, 92, 93, 96, 97, 101, 106, 107, 108, 109, 111, 112], "window": [2, 9, 39, 84, 112], "http": [2, 9, 11, 19, 84, 87, 104, 106, 107, 111, 112], "connect": [2, 5, 87, 93, 94, 95, 101, 102, 103], "properti": [2, 4, 11, 113], "unwrap": [2, 11, 16, 87], "non": [2, 4, 7, 9, 112, 113], "wrap": [2, 3, 9, 10, 11, 12, 13, 14, 15, 16, 112], "_np_random": 2, "meth": 2, "much": [2, 19, 45, 46, 47, 48, 49, 53, 54, 97, 112, 113], "creat": [2, 3, 6, 8, 9, 10, 13, 16, 29, 83, 84, 85, 100, 101, 104, 105, 111], "creation": [2, 10, 112], "tutori": [2, 16, 18, 111], "gymnasium": [3, 4, 5, 6, 7, 8, 9, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 106, 107, 108, 109, 111, 113], "allow": [3, 4, 5, 9, 11, 12, 14, 15, 16, 17, 18, 19, 50, 68, 87, 88, 89, 90, 91, 98, 99, 100, 101, 112], "load": 3, "pre": 3, "sever": [3, 6, 11, 13, 16, 18, 19, 49, 104], "id": [3, 10, 108, 112], "kwarg": [3, 9, 10, 11, 17, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 112], "env": [3, 9, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 83, 84, 85, 87, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 107, 108, 109, 110, 111, 113], "liter": 3, "mountaincar": [3, 89], "mountaincarcontinu": [3, 90], "supportsfloat": [3, 6, 11, 18], "pendulum": [3, 10, 14, 16, 86, 87, 88, 92], "acrobot": [3, 86], "lunarland": [3, 13, 16, 18, 85, 110], "v2": [3, 12, 13, 16, 18, 83, 84, 85, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 109, 110], "lunarlandercontinu": [3, 12], "bipedalwalk": [3, 11, 12, 16, 83], "v3": [3, 11, 12, 16, 83, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 109], "bipedalwalkerhardcor": 3, "carrac": [3, 9, 14, 84], "blackjack": [3, 16, 105], "frozenlak": [3, 9, 108], "frozenlake8x8": 3, "cliffwalk": [3, 107], "taxi": [3, 105], "reacher": [3, 11, 92, 100], "v4": [3, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103], "pusher": 3, "invertedpendulum": [3, 92, 98, 99], "inverteddoublependulum": [3, 98], "halfcheetah": [3, 92, 94], "hopper": [3, 92, 103], "swimmer": [3, 92], "walker2d": [3, 92], "ant": [3, 92, 95, 103], "humanoidstandup": [3, 92, 97], "humanoid": [3, 40, 92, 93], "accord": [3, 5, 6, 10, 85], "given": [3, 6, 11, 14, 66, 69, 83, 85, 86, 87, 89, 90, 93, 95, 96, 103, 111, 113], "find": [3, 19, 20, 45, 46, 47, 48, 49, 55, 64, 76, 98, 101, 104, 112], "avail": [3, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 85, 104, 112], "modul": [3, 8, 112], "eg": [3, 9, 112], "max_episode_step": [3, 13, 112], "length": [3, 5, 6, 9, 11, 13, 14, 83, 87, 88, 89, 90, 94, 102, 104, 111], "autoreset": [3, 10, 112], "autoresetwrapp": [3, 11, 13, 112], "apply_api_compat": [3, 13, 17], "stepapicompat": [3, 11, 13, 17], "argument": [3, 4, 5, 6, 7, 9, 10, 14, 16, 17, 82, 86, 105, 111, 112], "fals": [3, 9, 10, 13, 14, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 84, 85, 93, 94, 95, 96, 102, 103, 106, 108, 111, 112], "disable_env_check": [3, 10], "checker": [3, 10], "addit": [3, 4, 10, 11, 13, 16, 18, 19, 25, 36, 66, 70, 85, 86, 87, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 106, 109, 111, 112], "constructor": [3, 4, 5, 6, 9, 11, 16, 112], "rais": [3, 6, 7, 8, 9, 10, 13, 14, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103], "error": [3, 6, 9, 11, 13, 111, 113], "entry_point": [3, 112], "callabl": [3, 8, 9, 10, 13, 14, 15], "reward_threshold": [3, 93, 94, 95, 96, 97, 100, 101, 102, 103, 112], "nondeterminist": [3, 112], "order_enforc": [3, 112], "syntax": 3, "namespac": [3, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 112], "env_nam": [3, 17], "v": [3, 6, 68, 98], "keyword": [3, 5, 10, 14, 16, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 106, 111, 112], "entri": 3, "point": [3, 7, 9, 11, 19, 22, 23, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 40, 41, 42, 43, 44, 46, 50, 51, 54, 61, 62, 63, 64, 65, 66, 67, 69, 71, 72, 73, 75, 76, 79, 83, 84, 85, 87, 88, 91, 101, 104, 106, 113], "threshold": [3, 87, 88, 109, 112], "consid": [3, 14, 84, 85, 86, 92, 93, 95, 96, 103, 104, 112], "learnt": 3, "knowledg": 3, "limit": [3, 16, 35, 43, 50, 51, 64, 69, 98, 99, 111], "enabl": [3, 11, 19, 84, 104], "order": [3, 4, 5, 11, 16, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 92, 93, 94, 95, 96, 97, 98, 99, 100, 103, 104, 112], "enforc": 3, "correct": [3, 109, 112, 113], "disabl": [3, 13], "recommend": [3, 10, 13, 18, 19, 45, 46, 47, 48, 49, 85, 93, 96, 97, 111, 112], "onli": [3, 4, 5, 6, 7, 10, 11, 12, 13, 14, 18, 19, 21, 23, 24, 25, 26, 27, 30, 32, 34, 35, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 51, 53, 56, 58, 59, 60, 62, 63, 65, 66, 67, 68, 69, 70, 72, 73, 75, 76, 77, 79, 80, 89, 90, 93, 94, 95, 96, 98, 100, 101, 103, 104, 111, 112], "env_id": [3, 17], "retriev": [3, 13, 40, 43, 69], "global": 3, "superclass": [4, 12, 14, 15], "crucial": 4, "thei": [4, 10, 13, 14, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 101, 105, 106, 112], "serv": [4, 93, 94, 95, 96, 102, 103], "variou": [4, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 97, 104], "purpos": [4, 104], "clearli": 4, "interact": [4, 9, 19, 104, 111, 112], "environ": [4, 6, 8, 11, 12, 14, 15, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 105, 106, 107, 108, 109, 113], "look": [4, 9, 11, 13, 15, 16, 19, 21, 23, 24, 25, 26, 27, 30, 32, 34, 35, 39, 41, 42, 43, 44, 53, 56, 58, 59, 60, 62, 63, 65, 68, 70, 72, 73, 75, 76, 77, 79, 80, 112, 113], "like": [4, 6, 9, 11, 12, 13, 14, 15, 16, 21, 22, 23, 24, 25, 26, 27, 28, 30, 32, 34, 35, 39, 41, 42, 43, 44, 53, 56, 58, 59, 60, 61, 62, 63, 64, 65, 70, 72, 73, 75, 76, 77, 79, 80, 83, 85, 93, 94, 96, 97, 99, 100, 101, 103, 104, 112], "u": [4, 6, 11, 15, 19, 104, 105, 111, 112], "work": [4, 9, 11, 13, 14, 19, 84, 85, 87, 94, 95, 98, 99, 103], "highli": [4, 18, 19, 82, 86, 112], "structur": [4, 5, 7, 104, 112], "data": [4, 7, 9, 11, 18, 111, 112], "form": [4, 5, 6, 13, 87, 102, 112], "painlessli": 4, "transform": [4, 7, 9, 11, 12, 13, 101], "them": [4, 11, 13, 17, 18, 19, 21, 22, 23, 26, 27, 31, 35, 42, 63, 72, 85, 94, 101, 104], "flat": [4, 5, 6, 7, 14], "sampl": [4, 5, 6, 7, 8, 9, 10, 14, 15, 16, 18, 85, 109, 110, 111, 112], "especi": [4, 15, 112], "hierarch": [4, 109], "via": [4, 5, 11, 13, 14, 15, 16, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 86, 92, 104, 105, 112], "build": [4, 11, 21, 39, 43, 98, 103, 104], "express": [4, 9, 93, 96, 97], "inherit": [4, 11, 12, 14, 15, 16, 112], "cover": [4, 111], "parametr": 4, "probabl": [4, 19, 108, 109, 111, 113], "distribut": [4, 5, 6, 102], "batch": [4, 8, 10], "vectorenv": 4, "moreov": [4, 13, 19, 22, 32, 112], "implement": [4, 5, 10, 12, 13, 14, 15, 16, 17, 18, 19, 91, 98, 104, 105, 107, 112], "handl": [4, 10, 98, 111], "care": [4, 70], "immut": 4, "mask": [4, 5, 6, 18, 104, 109], "t_cov": 4, "randomli": [4, 5, 85, 112], "uniform": [4, 6, 89, 90, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103], "bounded": 4, "int8": [4, 6], "member": [4, 53], "possibli": [4, 5, 6, 8, 11, 13, 16, 104], "subspac": [4, 5, 6, 7], "to_json": 4, "sample_n": 4, "jsonabl": 4, "from_json": 4, "complex": [4, 5, 96, 97, 98, 99], "matric": 4, "multidiscret": [4, 5, 7, 8, 10, 16, 112], "binari": [4, 6, 16, 112], "hold": [4, 106, 111], "down": [4, 6, 19, 23, 25, 26, 32, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 52, 53, 56, 58, 60, 61, 63, 65, 73, 75, 76, 79, 80, 84, 97, 106, 107, 108, 111, 112, 113], "button": [4, 6, 9, 16], "multibinari": [4, 5, 7, 8, 16], "multipl": [4, 5, 6, 8, 10, 104], "ax": [4, 6, 111, 112], "messag": 4, "mission": [4, 52, 54, 55], "detail": [4, 9, 13, 16, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 87, 104, 112], "join": 4, "togeth": [4, 19, 92], "vectoris": 4, "separ": [4, 5, 18, 112], "readabl": [4, 5], "fix": [4, 5, 6, 11, 13, 15, 16, 18, 52, 87, 88, 91, 92, 93, 94, 95, 96, 98, 99, 103, 108, 109, 112], "unord": 4, "entiti": 4, "select": [4, 6, 42, 93, 96, 97, 100, 101, 104], "graph": [4, 7, 16], "node": [4, 5, 7], "edg": [4, 5, 7, 88], "flatten": [4, 7, 11, 92, 107, 111, 112], "unflatten": [4, 7], "neural": [4, 7, 87, 102, 104], "network": [4, 7, 102, 104], "flatdim": [4, 7], "dimens": [4, 6, 7, 14, 93, 94, 95, 96, 102, 103, 104], "flatten_spac": [4, 7], "revers": [4, 7, 106], "size": [4, 13, 108, 112], "batch_spac": [4, 8], "concaten": [4, 7, 8, 92], "iter": [4, 5, 8, 10], "create_empty_arrai": [4, 8], "create_shared_memori": [4, 8], "read_from_shared_memori": [4, 8], "write_to_shared_memori": [4, 8], "spaces_kwarg": 5, "constitu": 5, "usag": [5, 6, 7, 11, 84], "ordereddict": [5, 8, 14], "nest": [5, 8, 104], "ext_control": 5, "5": [5, 6, 7, 8, 12, 13, 19, 21, 23, 24, 25, 26, 29, 30, 32, 35, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 53, 56, 58, 59, 60, 62, 63, 65, 72, 73, 75, 76, 77, 79, 80, 83, 84, 85, 87, 89, 93, 94, 95, 96, 97, 98, 100, 101, 102, 103, 104, 106, 109, 111, 112], "inner_st": 5, "charg": 5, "100": [5, 7, 13, 33, 43, 66, 67, 83, 84, 85, 87, 90, 95, 100, 107], "system_check": 5, "10": [5, 6, 12, 19, 26, 32, 45, 46, 47, 48, 49, 56, 63, 66, 69, 83, 85, 91, 93, 94, 95, 96, 97, 98, 100, 101, 102, 103, 104, 106, 107, 109, 111, 112], "job_statu": 5, "progress": [5, 75], "conveni": [5, 11, 16, 112], "easili": [5, 11, 104], "flattenobserv": [5, 11, 14, 112], "similar": [5, 18, 23, 34, 100, 112], "deal": 5, "instanti": [5, 9, 13, 14, 15, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 112], "either": [5, 6, 7, 9, 13, 16, 17, 19, 42, 52, 89, 90, 106, 108], "avoid": [5, 8, 11, 16, 19, 22, 23, 25, 30, 31, 39, 41, 57, 58, 60, 65, 67, 68, 73], "independ": [5, 6, 10, 95, 101, 102, 103], "same": [5, 7, 9, 10, 14, 51, 83, 84, 87, 100, 101, 102, 109, 111, 113], "attr": 5, "warn": [5, 9, 10, 13], "guarante": [5, 19], "uniqu": [5, 82, 86, 92, 98], "sub": [5, 10, 69], "precis": 5, "cartesian": [5, 6, 91], "product": [5, 6], "03633198": 5, "42370757": 5, "involv": [5, 82, 98, 99, 104, 108, 112], "reproduc": [5, 18], "method": [5, 9, 12, 13, 14, 15, 17, 104, 109, 112], "draw": [5, 106, 111, 112], "42": [5, 6, 88, 96, 97, 110], "54": 5, "finit": [5, 6, 12, 93, 97, 98, 99, 100, 101, 103, 113], "a_0": 5, "dot": [5, 6, 112], "a_n": 5, "a_i": 5, "belong": [5, 8, 104], "n": [5, 6, 7, 8, 16, 19, 38, 84, 87, 91, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 111], "0259352": 5, "80977976": 5, "80066574": 5, "77165383": 5, "must": [5, 7, 8, 9, 10, 11, 12, 13, 14, 16, 18, 19, 20, 21, 24, 26, 27, 28, 29, 31, 35, 36, 37, 40, 43, 44, 53, 57, 59, 60, 65, 84, 95, 103, 104, 112, 113], "length_mask": 5, "sample_mask": 5, "drawn": [5, 6, 100, 102], "geometr": 5, "featur": [5, 6, 104], "feature_spac": 5, "node_spac": [5, 7], "edge_spac": [5, 7], "seri": [5, 16], "adjac": 5, "matrix": [5, 107], "edge_link": [5, 7], "num_nod": 5, "num_edg": 5, "graphinst": [5, 7], "between": [5, 6, 13, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 85, 87, 88, 91, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 111, 112, 113], "don": [5, 11, 18, 19, 35, 45, 46, 47, 48, 49, 69, 84, 89, 112, 113], "edge_mask": 5, "multipli": [5, 90], "attribut": [5, 16, 18, 100, 101, 112], "_gener": 6, "unbound": 6, "mathbb": 6, "interv": [6, 16, 93, 95, 96, 103], "There": [6, 11, 16, 51, 52, 64, 83, 84, 85, 86, 89, 90, 92, 97, 98, 99, 100, 101, 104, 106, 107, 109, 112], "common": [6, 11, 14, 16, 113], "ident": [6, 10, 14], "lower": [6, 16, 93, 94, 95, 96, 97, 100, 101, 102, 103, 111], "upper": [6, 16, 96, 97], "construct": [6, 19, 45, 46, 47, 48, 49, 87, 93, 94, 95, 96, 102, 103, 112], "scalar": [6, 12], "respect": [6, 10, 11, 13, 16, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 85, 87, 93, 96, 97, 102], "assum": [6, 14, 112], "across": [6, 8, 25, 35, 46, 47, 50], "infer": [6, 92], "essenti": 6, "valueerror": [6, 7, 8, 10, 13, 14], "coordin": [6, 11, 14, 83, 85, 91, 93, 94, 95, 96, 97, 98, 100, 101, 102, 103, 104], "shift": [6, 16], "exponenti": [6, 11, 15], "unsupport": 6, "is_bound": 6, "manner": [6, 11, 14, 51], "both": [6, 10, 13, 14, 16, 17, 83, 86, 87, 101, 103, 104, 106, 108, 109, 112, 113], "sens": [6, 104], "One": [6, 16, 93, 96, 97, 104], "neither": [6, 13, 106], "nor": [6, 13, 106, 107], "consist": [6, 11, 14, 16, 19, 32, 83, 87, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 106, 111, 112], "mani": [6, 13, 14, 16, 19, 25, 28, 32, 51, 54, 69, 79, 104, 111, 112], "subset": [6, 12, 19, 45, 46, 47, 48, 49, 112], "smallest": 6, "uniformli": [6, 19, 87, 88, 100, 101, 112], "infeas": 6, "sort": 6, "fair": 6, "coin": 6, "toss": 6, "per": [6, 10, 32, 51, 74, 109, 113], "nvec": 6, "int64": [6, 7], "game": [6, 9, 13, 16, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 58, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 82, 106, 111, 112], "keyboard": [6, 9], "alwai": [6, 7, 13, 19, 85, 89, 90, 93, 96, 97, 100, 102, 108, 109, 112], "noop": [6, 9, 13, 19, 21, 23, 24, 25, 26, 27, 30, 32, 34, 35, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 53, 56, 58, 59, 60, 62, 63, 65, 70, 72, 73, 75, 76, 77, 79, 80], "nintendo": 6, "conceptu": 6, "arrow": [6, 63], "left": [6, 19, 21, 23, 24, 25, 26, 30, 34, 35, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 51, 52, 53, 56, 58, 59, 60, 62, 65, 69, 70, 72, 73, 75, 76, 79, 80, 83, 84, 85, 88, 89, 93, 96, 97, 98, 99, 103, 107, 108, 111, 112], "param": 6, "min": [6, 12, 87, 88, 89, 90, 91, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103], "max": [6, 12, 13, 87, 88, 89, 90, 91, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 111], "press": [6, 9, 16, 84, 87], "although": 6, "rare": 6, "d": [6, 9, 87, 100, 101, 104], "categor": 6, "vector": [6, 9, 11, 83, 85, 97, 98, 99, 100, 101, 108], "count": [6, 83, 85, 106, 111], "complic": [6, 11], "kind": 6, "unless": [6, 11, 109, 112], "max_length": 6, "min_length": 6, "charset": 6, "frozenset": 6, "6": [6, 7, 19, 23, 24, 25, 26, 30, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 53, 56, 58, 60, 74, 75, 76, 79, 80, 87, 89, 90, 93, 94, 95, 96, 97, 98, 100, 101, 102, 103, 107, 109], "7": [6, 9, 19, 23, 25, 26, 30, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 53, 56, 58, 60, 75, 76, 79, 80, 93, 94, 95, 96, 97, 98, 100, 101, 102, 103], "8": [6, 9, 10, 17, 19, 21, 23, 25, 26, 28, 30, 34, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 53, 56, 58, 59, 75, 79, 80, 84, 85, 87, 88, 91, 93, 94, 95, 96, 97, 98, 100, 101, 102, 103, 108], "9": [6, 8, 10, 19, 23, 26, 31, 40, 45, 46, 47, 48, 49, 53, 56, 66, 75, 80, 87, 91, 93, 94, 95, 96, 97, 98, 100, 101, 103, 106, 111], "c": [6, 68, 85, 87, 104], "f": [6, 14, 15, 108, 111], "h": [6, 108], "j": [6, 19], "k": [6, 7, 9, 13, 85, 102], "l": [6, 13, 102], "m": [6, 7, 19, 38, 87, 89, 90, 91, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 112], "o": 6, "p": [6, 94, 108, 109], "q": [6, 65, 109, 113], "w": [6, 9, 93, 96, 97], "z": [6, 93, 94, 95, 96, 97, 100, 101, 103], "compris": 6, "charact": [6, 9, 53, 64], "b5": 6, "hello": 6, "0123456789": 6, "digit": [6, 104], "inclus": [6, 19], "prevent": [6, 10, 42, 104], "empti": [6, 8, 13, 69, 111], "english": 6, "alphabet": 6, "plu": [6, 35, 107], "latin": 6, "charlist": 6, "zero": [6, 8, 91, 94, 104, 111, 112, 113], "matter": 6, "equival": [7, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81], "would": [7, 12, 14, 15, 93, 94, 95, 96, 97, 102, 103, 110, 112], "notimplementederror": 7, "cannot": [7, 8, 13, 16, 18, 107, 112, 113], "attempt": [7, 85, 97, 98], "compound": 7, "func": 7, "oper": [7, 13], "itself": [7, 10, 11, 13, 16, 17, 104], "boundari": 7, "while": [7, 18, 19, 22, 23, 39, 54, 57, 58, 59, 60, 63, 65, 67, 69, 73, 76, 78, 85, 87, 88, 91, 93, 94, 96, 97, 100, 101, 102, 104, 106, 111, 112, 113], "being": [7, 13, 40, 89, 90, 91, 93, 96, 97, 101, 104, 109, 111], "exactli": [7, 102], "origin": [7, 10, 12, 13, 14, 18, 84, 87, 98, 100, 101], "effect": [7, 8, 11, 13, 14, 16, 19, 45, 46, 47, 48, 49, 85, 98, 99, 109, 111], "flattenend": 7, "60": [7, 53, 66, 104], "recurs": 7, "12": [7, 19, 26, 28, 32, 34, 45, 46, 47, 48, 49, 53, 56, 68, 85, 87, 88, 93, 94, 95, 96, 97, 100, 103, 111], "hot": 7, "match": [7, 10, 12, 74], "copi": [8, 10, 112], "item": [8, 9, 104, 111], "_": [8, 9, 10, 11, 16, 110], "6348213": 8, "28607962": 8, "60760117": 8, "87383074": 8, "192658": 8, "2148103": 8, "99644893": 8, "08304597": 8, "7238421": 8, "35848552": 8, "1533453": 8, "67958736": 8, "49076623": 8, "38661423": 8, "7975036": 8, "93317133": 8, "stopiter": 8, "fn": 8, "built": [8, 18, 104], "multi_binari": 8, "multi_discret": 8, "ctx": 8, "multiprocess": [8, 10], "opt": 8, "hostedtoolcach": 8, "15": [8, 19, 42, 45, 46, 47, 48, 49, 53, 72, 85, 93, 94, 96, 97, 100, 103, 104, 108], "x64": 8, "lib": [8, 107], "python3": 8, "process": [8, 9, 10, 14, 16, 87, 100, 112, 113], "eventu": 8, "shared_memori": [8, 10], "customspaceerror": 8, "read": [8, 18, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 83, 84, 85, 87, 88, 89, 90, 91, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 106, 107, 108, 109], "forward": [8, 30, 52, 83, 93, 94, 95, 96, 97, 102, 103], "vice": [8, 13], "versa": [8, 13], "side": [8, 14, 21, 34, 49, 51, 85], "write": [8, 10, 112], "num_env": [8, 10], "plai": [9, 16, 29, 42, 55, 74, 79, 84, 104, 106, 111, 112], "transpos": [9, 112], "zoom": 9, "callback": 9, "keys_to_act": 9, "dw": 9, "particularli": [9, 13, 88], "verifi": 9, "level": [9, 16, 19, 26, 43, 65, 73, 104], "preprocess": [9, 11], "unplay": 9, "wish": [9, 14, 18], "real": [9, 51, 94, 104], "statist": 9, "playplot": 9, "here": [9, 87, 112], "last": [9, 13, 41, 42, 52, 94, 97, 100, 101, 112, 113], "150": 9, "def": [9, 11, 12, 14, 15, 111, 112], "obs_t": 9, "obs_tp1": 9, "rew": [9, 113], "plotter": 9, "render_fp": [9, 13, 112], "30": [9, 13, 19, 63, 66, 96, 97], "amount": [9, 39, 41, 42, 44, 50, 69, 83, 88, 98, 99], "input": [9, 10, 16, 111], "receiv": [9, 10, 16, 29, 32, 36, 39, 40, 46, 52, 55, 84, 85, 90, 103, 111, 113], "map": [9, 14, 16, 37, 108, 109, 111, 112], "unicod": 9, "suppos": 9, "trigger": [9, 109], "key_to_act": 9, "ord": [9, 112], "unknown": [9, 104], "horizon_timestep": 9, "plot_nam": 9, "live": [9, 22, 25, 28, 29, 31, 34, 39, 40, 43, 50, 54, 55, 61, 67, 72, 111], "transit": [9, 16, 19, 45, 46, 47, 48, 49, 96, 97, 109, 113], "compute_metr": 9, "obs_tp": 9, "cumulative_reward": 9, "linalg": [9, 112], "norm": [9, 100, 101, 112], "its": [9, 10, 12, 13, 34, 41, 64, 76, 81, 85, 91, 92, 102, 104], "along": [9, 11, 16, 17, 53, 54, 56, 67, 84, 88, 89, 90, 94, 98, 99, 102, 104], "conjunct": 9, "evolv": 9, "200": [9, 44, 67, 85, 87, 88, 89, 91], "immedi": [9, 11, 15, 106, 112], "cumul": [9, 11, 13], "magnitud": [9, 85, 90, 98, 99], "your_env": 9, "len": [9, 12, 111], "horizon": [9, 69, 95, 103, 113], "titl": [9, 89, 90, 111], "dependencynotinstal": [9, 13], "matplotlib": [9, 111], "playablegam": 9, "process_ev": 9, "event": [9, 112], "particular": [9, 11, 14, 16, 17, 85, 113], "keep": [9, 11, 13, 27, 40, 59, 62, 70, 71, 79, 88, 97, 112], "track": [9, 11, 13, 71, 84, 88, 93, 94, 95, 96, 97, 98, 99, 102, 103], "exit": [9, 10], "save_video": 9, "video_fold": [9, 13], "episode_trigg": [9, 13], "step_trigg": [9, 13], "video_length": [9, 13], "name_prefix": [9, 13], "rl": [9, 13, 110, 111, 113], "episode_index": 9, "step_starting_index": 9, "extract": 9, "compos": 9, "record": [9, 11, 83], "store": [9, 10, 13], "iff": [9, 13, 112], "isn": 9, "entir": [9, 13, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 95, 103, 104], "snippet": [9, 13], "captur": [9, 13, 78], "Will": [9, 13], "prepend": [9, 13], "filenam": [9, 13], "moviepi": [9, 13], "imagesequenceclip": 9, "durat": [9, 93, 95, 96, 97, 98, 99, 100, 101, 103], "step_index": 9, "199": 9, "capped_cubic_video_schedul": 9, "episode_id": 9, "27": [9, 87, 93, 96, 97], "729": 9, "1000": [9, 13, 16, 67, 69, 84, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 110], "2000": [9, 83], "3000": 9, "schedul": [9, 108], "step_api_compat": [9, 17], "step_return": 9, "output_truncation_bool": [9, 13], "is_vector_env": 9, "doc": [9, 13, 85], "ob": [9, 11, 14, 109, 111], "interfac": [9, 104, 110], "conflict": [9, 104], "written": [9, 11, 18], "final": [9, 10, 13, 52, 111, 112, 113], "desir": [9, 102, 103], "oldenv": 9, "vec_env": 9, "convert_to_terminated_truncated_step_api": [9, 17], "irrespect": 9, "convert_to_done_step_api": 9, "omit": [9, 92, 93, 94, 95, 96, 97, 102, 103], "env_check": 9, "check_env": 9, "skip_render_check": 9, "invas": [9, 73], "farama": [9, 11, 104, 111, 112], "org": [9, 19, 104, 111], "content": 9, "environment_cr": [9, 112], "ignor": [9, 19, 106, 111], "skip": [9, 13, 19, 112], "ci": 9, "parallel": 10, "linear": [10, 85, 87, 98, 99, 102], "speed": [10, 30, 83, 84, 109], "taken": [10, 13, 43, 49, 86, 88, 109, 112], "wait": [10, 43, 45, 69, 113], "until": [10, 11, 42, 55, 100, 106, 112], "overwritten": [10, 11], "final_observ": [10, 13], "final_info": [10, 13], "asyncvectorenv": 10, "syncvectorenv": 10, "single_observation_spac": 10, "single_action_spac": 10, "v25": [10, 18], "old": [10, 11, 13, 17, 110], "vectorlistinfo": [10, 11, 13], "rememb": [10, 13, 84, 112], "share": 10, "other": [10, 11, 12, 13, 14, 17, 25, 34, 37, 45, 51, 85, 91, 92, 94, 98, 100, 101, 103, 109, 111, 112], "word": [10, 100], "02240574": 10, "03439831": 10, "03904812": 10, "02810693": 10, "01586068": 10, "01929009": 10, "02394426": 10, "04016077": 10, "01314174": 10, "03893502": 10, "02400815": 10, "0038326": 10, "instead": [10, 14, 16, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 83, 87, 103, 112], "00122802": 10, "16228443": 10, "02521779": 10, "23700266": 10, "00788269": 10, "17490888": 10, "03393489": 10, "31735462": 10, "04918966": 10, "19421194": 10, "02938497": 10, "29495203": 10, "releas": [10, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 87, 89, 90, 91, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 106, 107, 108, 109, 112], "resourc": [10, 111, 112], "viewer": 10, "close_extra": 10, "synchron": 10, "asynchron": 10, "garbag": 10, "program": [10, 104], "04456399": 10, "04653909": 10, "01326909": 10, "02099827": 10, "03073904": 10, "00145001": 10, "03088818": 10, "03131252": 10, "03468829": 10, "01500225": 10, "01230312": 10, "01825218": 10, "registri": [10, 16], "env_fn": 10, "context": 10, "daemon": 10, "worker": [10, 63], "pipe": 10, "commun": 10, "lambda": [10, 14, 15, 111], "81": [10, 91], "62": 10, "8286432": 10, "5597771": 10, "90249056": 10, "85009176": 10, "5266346": 10, "60007906": 10, "back": [10, 11, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 47, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 93, 94], "improv": 10, "effici": [10, 14, 89, 90, 98, 104], "larg": [10, 11, 18, 90, 93, 94, 95, 96, 97, 100, 101, 102, 103, 104], "subprocess": 10, "flag": [10, 89, 104], "turn": [10, 13, 18, 22, 23, 84, 85, 98], "quit": [10, 112], "head": [10, 94], "spawn": [10, 101], "children": 10, "overrid": [10, 11], "inner": 10, "logic": [10, 84, 112], "advanc": [10, 87, 104], "degre": [10, 14, 96, 97, 98], "flexibl": [10, 104], "chanc": 10, "shoot": [10, 26, 35, 37, 42, 43, 50, 51, 60, 63, 67, 72, 73, 81], "yourself": [10, 43, 63, 84, 111, 112], "foot": [10, 94, 95, 103], "thu": [10, 19, 45, 46, 47, 48, 49, 100, 101, 104], "own": [10, 18, 34, 69], "_worker": 10, "_worker_shared_memori": 10, "runtimeerror": 10, "serial": 10, "modular": [11, 12, 14, 15, 16, 104, 112], "behavior": [11, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 91, 93, 94, 95, 96, 97, 102, 103, 104, 112], "modif": [11, 100, 101], "without": [11, 16, 41, 96, 106, 108, 111, 112], "alter": [11, 16, 19, 112], "lot": [11, 16, 111], "boilerpl": [11, 16, 112], "chain": [11, 16, 87, 102], "rescaleact": [11, 12, 16], "base_env": [11, 16], "wrapped_env": [11, 12, 13, 16, 112], "min_act": [11, 12, 16], "max_act": [11, 12, 16], "access": [11, 13, 18, 50], "underneath": [11, 16, 88], "anoth": [11, 34, 96, 97, 99, 100, 101, 103, 109, 111, 113], "orderenforc": [11, 13, 16, 112], "get": [11, 16, 19, 39, 42, 43, 44, 51, 61, 62, 63, 64, 66, 67, 68, 73, 83, 85, 93, 95, 96, 98, 106, 111, 113], "layer": [11, 16, 104], "bare": 11, "just": [11, 16, 45, 51, 68, 99, 101], "box2d": [11, 16, 83, 84, 85], "bipedal_walk": [11, 16, 83], "0x7f87d70712d0": [11, 16], "three": [11, 19, 22, 25, 27, 40, 48, 54, 61, 66, 67, 68, 69, 93, 95, 96, 97, 102, 103, 112], "thing": [11, 14, 19], "do": [11, 13, 14, 15, 19, 32, 44, 65, 69, 70, 84, 85, 87, 93, 94, 95, 96, 102, 103, 112], "Such": 11, "actionwrapp": [11, 12], "observationwrapp": [11, 14, 112], "rewardwrapp": [11, 15], "present": [11, 87, 104, 111, 112, 113], "section": [11, 19, 70, 93, 94, 95, 96, 102, 103, 111, 112], "found": [11, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 92, 111], "github": [11, 92, 107, 112], "com": [11, 104, 107, 112], "foundat": [11, 104, 112], "forget": [11, 112], "commonli": [11, 16], "page": [11, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 83, 84, 85, 87, 88, 89, 90, 91, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 106, 107, 108, 109], "descript": [11, 104, 112], "ataripreprocess": [11, 13], "misc": 11, "tp": 11, "atari": [11, 16, 17, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 111], "clipact": [11, 12, 16], "clip": [11, 15, 16, 89, 90, 93, 96, 112], "envcompat": [11, 13, 17, 18], "compat": [11, 14, 16, 104, 110], "21": [11, 17, 93, 96, 97, 100, 106, 111], "filterobserv": [11, 14], "filter": 11, "request": [11, 106], "framestack": [11, 13], "anobserv": 11, "stack": [11, 14], "roll": [11, 14, 32, 100], "grayscaleobserv": [11, 14], "grai": [11, 13], "scale": [11, 13, 15, 19, 85, 93, 94, 95, 96, 102, 103, 104], "humanrend": [11, 13], "normalizeobserv": [11, 14], "center": [11, 14, 84, 85, 88, 91, 93, 94, 96, 97, 107], "unit": [11, 14, 53, 87, 89, 90, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103], "varianc": [11, 14, 15], "normalizereward": [11, 15], "averag": [11, 15, 96, 113], "pixelobservationwrapp": [11, 14], "augment": [11, 14], "obtain": [11, 13, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 91, 106, 113], "ad": [11, 13, 14, 16, 18, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 47, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 85, 90, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 109, 112], "replac": [11, 18, 106, 111], "recordepisodestatist": [11, 13, 18, 111], "recordvideo": [11, 13, 18], "rollout": [11, 13, 109], "save": [11, 13, 18], "rescal": [11, 16], "resizeobserv": [11, 14], "axbxc": [11, 14], "resiz": [11, 13], "timeawareobserv": [11, 14, 16], "trajectori": [11, 14, 15, 85, 96, 97], "append": [11, 14, 111], "transformobserv": [11, 14], "transformreward": [11, 15], "th": 11, "sometim": [11, 15, 112], "still": [11, 18, 19, 111], "let": [11, 12, 15, 19, 34, 104, 111, 112], "penal": [11, 70], "energi": [11, 83, 85, 88, 104], "weight": [11, 93, 94, 95, 96, 100, 101, 102, 103, 104, 113], "those": [11, 21, 23, 24, 25, 26, 27, 30, 32, 34, 35, 39, 41, 42, 43, 44, 53, 56, 58, 59, 60, 62, 63, 65, 70, 72, 73, 75, 76, 77, 79, 80, 87, 92, 93, 94, 95, 96, 97, 98, 99, 103], "nevertheless": 11, "reacherrewardwrapp": 11, "reward_dist_weight": 11, "reward_ctrl_weight": 11, "reward_dist": [11, 100, 101], "reward_ctrl": [11, 100, 101], "suffici": [11, 25, 27, 29, 31, 36, 111], "simpli": [12, 13, 14, 15, 19, 107, 112], "overwrit": [12, 14, 15], "domain": [12, 84, 87, 89, 90, 104, 109], "sai": [12, 13], "discreteact": 12, "disc_to_cont": 12, "act": [12, 111], "__name__": 12, "__main__": 12, "print": [12, 112], "among": [12, 14, 86, 92], "biped": [12, 82, 96, 97], "walker": [12, 82, 92, 101, 103], "affin": [12, 85], "75": [12, 93], "noop_max": 13, "frame_skip": [13, 93, 94, 95, 96, 102, 103], "screen_siz": 13, "84": [13, 93, 96, 97], "terminal_on_life_loss": 13, "grayscale_ob": 13, "grayscale_newaxi": 13, "scale_ob": 13, "2600": [13, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81], "guidelin": 13, "machado": [13, 19], "et": [13, 19], "al": [13, 17, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 111], "2018": [13, 19, 87], "revisit": [13, 19], "arcad": [13, 19, 26, 43, 45, 46, 47, 48, 49, 104], "evalu": [13, 19, 104, 111], "protocol": [13, 19], "open": [13, 19, 32, 92, 104, 112], "problem": [13, 19, 85, 88, 91, 98, 99, 102, 106, 109, 110, 113], "stage": 13, "op": 13, "pool": [13, 102], "recent": [13, 14, 15, 17, 104], "life": [13, 25, 39, 43, 67, 71], "lost": [13, 28, 36, 55, 68, 72], "loss": [13, 106], "off": [13, 18, 36, 51, 59, 67, 84, 85, 109], "Not": 13, "squar": [13, 14, 68, 100, 101, 109, 112], "210x180": 13, "84x84": 13, "grayscal": [13, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81], "colour": [13, 84], "greyscal": 13, "255": [13, 14, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 84, 112], "No": [13, 87, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103], "frequenc": 13, "experi": [13, 93, 96, 97, 98, 99, 104, 111], "whenev": [13, 25, 28, 112], "channel": 13, "axi": [13, 89, 90, 94, 96, 97, 102, 111], "dimension": [13, 16, 23, 85, 93, 94, 95, 101, 102, 103, 104, 112], "memori": [13, 14, 89, 90], "optim": [13, 19, 83, 85, 96, 97, 104, 111], "benefit": 13, "opencv": 13, "caus": [13, 16, 52], "new_ob": 13, "final_reward": 13, "final_termin": 13, "final_trunc": 13, "final_don": 13, "prior": 13, "alongsid": [13, 104], "previou": [13, 93, 96, 97, 113], "re": [13, 51, 66, 69, 112], "old_env": 13, "legacyenv": 13, "retun": 13, "modern": [13, 104], "convers": [13, 17, 104], "passiveenvcheck": [13, 16], "cartpoleenv": 13, "customenv": 13, "manual": [13, 16, 18, 19, 45, 46, 47, 48, 49, 104], "unregist": 13, "surround": [13, 104], "test": [13, 83, 104, 112], "haven": 13, "screen": [13, 19, 21, 25, 29, 34, 35, 37, 46, 52, 58, 68, 69, 93, 94, 95, 96, 97, 98, 99, 102, 103], "nativ": [13, 105], "nonativerend": 13, "disable_render_order_enforc": 13, "classic_control": [13, 18, 86], "resetneed": 13, "deque_s": [13, 111], "At": [13, 16, 28, 39, 42, 53], "_episod": 13, "elaps": 13, "sinc": [13, 17, 19, 45, 46, 47, 48, 49, 82, 88, 92, 101, 104, 109, 112, 113], "begin": [13, 18, 25, 28, 41, 66, 67, 68, 69, 111, 112], "num": [13, 19, 21, 23, 24, 25, 26, 27, 30, 32, 34, 35, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 53, 56, 58, 59, 60, 62, 63, 65, 70, 72, 73, 75, 76, 77, 79, 80, 87, 88, 89, 90, 91, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103], "buffer": [13, 14, 84], "return_queu": [13, 111], "length_queu": [13, 111], "disable_logg": 13, "intermitt": 13, "hundredth": 13, "emploi": 13, "stop": [13, 16, 63, 73, 81, 104, 106, 111, 113], "span": 13, "strictli": 13, "logger": 13, "pop_fram": 13, "reset_clean": 13, "clear": [13, 73], "issu": [13, 16, 18, 19, 93, 95, 96, 97, 103, 112], "place": [13, 23, 88, 89, 90, 112], "part": [13, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 83, 84, 85, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 106, 107, 108, 109, 113], "\u01f9one": 13, "intend": [13, 104, 108], "around": [13, 29, 82, 101, 104], "outermost": 13, "actual": [13, 109, 112], "_k": 13, "classic": [13, 16, 18, 85, 87, 88, 89, 90, 91, 95, 99, 102, 103, 104, 113], "reflect": [14, 88], "2d": [14, 101, 104], "navig": [14, 28, 64, 112], "agent_posit": 14, "target_posit": 14, "throw": [14, 54], "awai": [14, 22, 62, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103], "freedom": [14, 96, 97, 98], "target": [14, 35, 87, 100, 101, 104, 112, 113], "rel": [14, 87, 96, 97, 112], "relativeposit": [14, 112], "ideal": 14, "subclass": 14, "accordingli": [14, 69, 112], "were": [14, 18, 36, 82, 87, 105, 112], "incorrectli": [14, 113], "randn": 14, "08319338": 14, "04635121": 14, "07394746": 14, "20877492": 14, "filter_kei": 14, "00067088": 14, "01860439": 14, "04772898": 14, "01911527": 14, "04560107": 14, "04466959": 14, "0328232": 14, "02367178": 14, "04649447": 14, "14996664": 14, "03329664": 14, "25847703": 14, "96": [14, 19, 84], "27648": 14, "num_stack": 14, "lz4_compress": 14, "lazyfram": 14, "fill": [14, 28, 112], "lz4": 14, "compress": 14, "keep_dim": 14, "uint8": [14, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81], "singleton": 14, "axbx1": 14, "axb": 14, "epsilon": [14, 15, 104, 111], "1e": [14, 15, 96, 102, 103], "08": [14, 15], "past": [14, 15], "newli": [14, 15], "stabil": [14, 15, 96, 97], "pixels_onli": 14, "render_kwarg": 14, "pixel_kei": 14, "choos": [14, 112], "odict_kei": 14, "400": [14, 109], "600": 14, "discard": 14, "assertionerror": 14, "show": [14, 18, 19, 29, 35, 106, 111], "typeerror": 14, "unexpect": 14, "64": [14, 19], "03810719": 14, "03522411": 14, "02231044": 14, "01088205": 14, "03881167": 14, "16021058": 14, "0220928": 14, "28875574": 14, "becaus": [15, 18, 111, 112], "intrins": 15, "gain": [15, 29, 65, 71, 72, 75], "numer": [15, 97, 98, 99, 106], "clipreward": 15, "min_reward": 15, "max_reward": 15, "invari": 15, "incorrect": [15, 113], "gamma": [15, 113], "99": 15, "discount": [15, 111, 113], "factor": [15, 111], "project": [16, 18, 104, 111], "mountain": [16, 86], "car": [16, 28, 44, 82, 86, 104], "four": [16, 28, 39, 84, 85, 93, 95, 103, 109, 111], "introduc": [16, 17, 18, 93, 96, 97], "core": 16, "markov": [16, 113], "decis": [16, 18, 104, 113], "theori": [16, 91, 98, 104], "perfect": 16, "reconstruct": 16, "miss": [16, 70, 87, 109], "compon": [16, 112], "veri": [16, 85, 100, 112], "easi": [16, 55, 104, 105], "loop": [16, 18, 104, 111], "pictur": 16, "simplifi": [16, 91, 104], "someth": 16, "spaceship": [16, 26, 40, 71], "land": [16, 33, 67, 85], "safe": [16, 63, 85], "document": [16, 19, 20, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 86, 93, 96, 97, 98, 105, 111, 112], "imagin": [16, 104], "robot": [16, 18, 31, 81, 83, 89, 90, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 113], "destroi": [16, 22, 24, 26, 27, 28, 29, 30, 31, 34, 35, 36, 37, 40, 41, 49, 55, 66, 67, 68, 71, 72, 73, 75, 85], "enemi": [16, 23, 24, 27, 29, 30, 31, 37, 40, 41, 43, 56, 65, 66, 68, 69, 71, 72, 73, 75, 81], "exchang": 16, "crash": [16, 85], "succeed": 16, "similarli": [16, 85], "restart": 16, "train": [16, 18, 109], "major": 16, "our": [16, 104, 111, 112], "simpl": [16, 83, 105, 107, 110, 113], "util": [16, 17, 112], "coupl": 16, "nich": 16, "li": [16, 104], "lie": 16, "full": [16, 19, 45, 46, 47, 48, 49, 84, 85, 111], "aspect": [16, 113], "regist": [17, 19], "sole": 17, "special": [17, 22, 52], "gymv26environ": 17, "relev": [17, 112], "pong": [17, 19, 34, 38], "v5": [17, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81], "signific": 17, "introduct": [17, 87, 106, 107], "signatur": 17, "previous": [17, 19, 28], "backward": [17, 94], "compliant": [17, 18], "oldv21env": 17, "break": [18, 26, 34, 84], "briefli": 18, "outlin": [18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 106, 111], "stuck": [18, 22, 31, 50], "123": 18, "emul": [18, 19], "awar": 18, "randint": 18, "utilis": 18, "contrast": 18, "older": [18, 92], "definit": [18, 93, 95, 96, 113], "expand": [18, 19, 45, 46, 47, 48, 49], "blog": 18, "post": [18, 27], "soon": [18, 109, 112], "extra": [18, 23, 28, 29, 31, 35, 37, 50, 69, 104, 111, 112], "These": [18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 92, 93, 96, 102, 104, 105, 111], "address": 18, "associ": 18, "librari": [18, 104, 105, 110, 112], "primari": 18, "shouldn": [18, 112], "happen": [18, 68, 89, 90, 93, 95, 96, 97, 98, 99, 100, 101, 103, 113], "fly": [18, 21, 26, 50, 66, 85], "shown": [18, 54, 84, 87, 113], "explan": [18, 111], "summari": 18, "goalenv": 18, "reimplement": 18, "system": [18, 49, 87, 91, 98, 99], "monitor": 18, "stella": 19, "adventur": [19, 38], "air": [19, 38], "raid": [19, 38], "alien": [19, 38, 40, 60, 73], "amidar": [19, 27, 38], "assault": [19, 38], "asterix": [19, 38], "asteroid": [19, 38], "atlanti": [19, 38], "licens": [19, 104, 111], "download": [19, 104, 111, 112, 113], "locat": [19, 55, 104, 109, 112], "agre": 19, "todo": 19, "legal": [19, 45, 46, 47, 48, 49], "fire": [19, 21, 23, 24, 26, 27, 30, 32, 34, 35, 45, 46, 47, 48, 49, 52, 59, 60, 62, 63, 65, 66, 68, 69, 72, 73, 75, 77, 79, 80, 85], "upright": [19, 25, 26, 30, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 53, 58, 88, 91, 98, 99], "upleft": [19, 25, 26, 30, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 53, 58], "downright": [19, 25, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 53, 56, 58], "downleft": [19, 25, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 53, 56, 58], "upfir": [19, 23, 26, 32, 45, 46, 47, 48, 49, 63, 75, 76, 77, 79, 80], "11": [19, 26, 45, 46, 47, 48, 49, 53, 56, 93, 94, 95, 96, 97, 98, 100, 101, 103, 106, 107, 111], "rightfir": [19, 21, 23, 24, 26, 27, 30, 35, 45, 46, 47, 48, 49, 53, 56, 59, 60, 62, 72, 75, 76, 79, 80], "leftfir": [19, 21, 23, 24, 26, 27, 35, 45, 46, 47, 48, 49, 53, 56, 59, 60, 62, 72, 75, 76, 79, 80], "13": [19, 26, 45, 46, 47, 48, 49, 53, 56, 93, 94, 96, 97, 100, 103], "downfir": [19, 23, 26, 32, 45, 46, 47, 48, 49, 53, 56, 60, 63, 75, 77, 80], "14": [19, 45, 46, 47, 48, 49, 53, 83, 85, 93, 94, 96, 97, 100, 103, 111], "uprightfir": [19, 26, 45, 46, 47, 48, 49, 53, 56], "upleftfir": [19, 26, 45, 46, 47, 48, 49, 53, 56], "16": [19, 28, 31, 34, 40, 45, 46, 47, 48, 49, 53, 91, 93, 94, 96, 97, 100, 103, 108, 111], "downrightfir": [19, 45, 46, 47, 48, 49, 53, 56], "17": [19, 31, 45, 46, 47, 48, 49, 53, 93, 94, 96, 97, 100, 103, 106], "downleftfir": [19, 45, 46, 47, 48, 49, 53, 56], "smaller": [19, 24, 26, 45, 46, 47, 48, 49], "enumer": [19, 45, 46, 47, 48, 49], "full_action_spac": [19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81], "reduc": [19, 21, 23, 24, 25, 26, 27, 30, 32, 34, 35, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 53, 56, 58, 59, 60, 62, 63, 65, 70, 72, 73, 75, 76, 77, 79, 80, 88, 111], "difficulti": [19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 104], "choic": 19, "player": [19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 104, 106, 111], "128": [19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81], "byte": [19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81], "ram": [19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81], "consol": [19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81], "exact": [19, 32, 45, 46, 47, 48, 49, 106, 111], "atariag": [19, 20, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 74, 76, 77, 78, 79, 80, 81], "determinist": [19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 87, 89, 90, 107, 109, 112], "art": 19, "memor": 19, "sticki": [19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81], "small": [19, 49, 68, 83, 104, 105], "On": [19, 60, 87, 88, 89, 90, 91], "top": [19, 34, 39, 46, 52, 54, 68, 84, 85, 86, 89, 90, 95, 98, 99, 103, 112], "repeat": [19, 100], "frameskip": [19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81], "exclus": [19, 104], "tabl": [19, 22, 23, 25, 39, 41, 96, 97, 100], "obs_typ": 19, "Its": 19, "repeat_action_prob": [19, 45, 46, 47, 48, 49], "stick": [19, 28, 50, 106, 111], "ll": [19, 52, 69, 111], "sound": 19, "lock": 19, "proper": 19, "audio": 19, "framer": [19, 97, 100, 101, 112], "best": [19, 45, 46, 47, 48, 49, 104, 111], "practic": [19, 45, 46, 47, 48, 49, 104, 111, 113], "configur": [19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 86, 92, 104, 105, 111, 112], "variat": 19, "amidardeterminist": 19, "amidarnoframeskip": 19, "ramdeterminist": 19, "ramnoframeskip": 19, "suffix": [19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81], "noframeskip": [19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81], "airraid": [19, 21], "31": [19, 26, 96, 97], "bankheist": [19, 28], "20": [19, 28, 34, 61, 69, 85, 93, 96, 97, 100, 109, 111], "24": [19, 28, 34, 59, 83, 84, 85, 88, 93, 96, 97, 111], "28": [19, 28, 34, 87, 96, 97], "battlezon": [19, 29], "beamrid": [19, 30], "berzerk": [19, 38], "18": [19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 93, 94, 96, 97, 100, 103], "bowl": [19, 38], "breakout": [19, 38], "32": [19, 34, 51, 96, 97, 106], "36": [19, 34, 96, 97], "40": [19, 34, 59, 96, 97], "44": [19, 34, 96, 97], "carniv": [19, 38], "centiped": [19, 38], "22": [19, 36, 93, 96, 97, 100, 111], "86": [19, 36], "choppercommand": [19, 37], "crazyclimb": [19, 39], "defend": [19, 27, 38, 43, 59, 71], "demonattack": [19, 41], "doubledunk": [19, 42], "elevatoract": [19, 43], "enduro": [19, 38], "fishingderbi": 19, "freewai": [19, 38], "frostbit": [19, 38], "gopher": [19, 38], "gravitar": [19, 38], "hero": [19, 38], "icehockei": 19, "jamesbond": [19, 38], "journeyescap": 19, "kangaroo": [19, 38], "krull": [19, 38], "kungfumast": [19, 56], "montezumareveng": [19, 57], "mspacman": [19, 58], "namethisgam": [19, 59], "phoenix": [19, 38], "pitfal": [19, 38, 83], "pooyan": [19, 38], "50": [19, 53, 63, 69, 85, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103], "70": [19, 63], "privateey": 19, "qbert": [19, 38], "riverraid": [19, 38], "roadrunn": [19, 67], "robotank": [19, 38, 68], "seaquest": [19, 38], "ski": [19, 38], "solari": [19, 38], "spaceinvad": 19, "stargunn": 19, "tenni": [19, 38], "timepilot": 19, "tutankham": [19, 38], "upndown": [19, 77], "ventur": [19, 38], "videopinbal": [19, 79, 80], "wizardofwor": [19, 80], "yarsreveng": 19, "zaxxon": [19, 38], "oppos": 19, "ai": [19, 104], "mg": 19, "bellemar": 19, "naddaf": 19, "veness": 19, "platform": [19, 104], "journal": 19, "artifici": 19, "intellig": 19, "research": [19, 92, 98, 104], "2012": 19, "url": 19, "jair": 19, "php": 19, "articl": [19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81], "view": [19, 49, 104], "11182": 19, "250": [20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81], "160": [20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81], "enchant": [20, 36], "chalic": 20, "golden": 20, "castl": 20, "pick": [20, 43, 54, 67, 109, 111], "sword": 20, "bridg": [20, 66, 104], "magnet": 20, "fight": [20, 33, 56, 59, 104], "outmanoeuvr": 20, "dragon": 20, "flavor": [20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81], "switch": [20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 104], "thorough": [20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81], "discuss": [20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81], "intric": [20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81], "stochast": [20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 86, 87, 89, 90, 92, 93, 94, 95, 96, 97, 98, 99, 101, 102, 103, 104, 109], "ship": [21, 22, 24, 30, 40, 49, 71], "sidewai": [21, 24, 30, 66, 70], "protect": [21, 27, 36, 37, 48, 53, 63], "saucer": [21, 26, 73], "try": [21, 22, 23, 32, 34, 39, 62, 63, 111], "drop": [21, 28, 109], "bomb": [21, 40, 52, 60, 73], "meaning": [21, 23, 24, 25, 26, 27, 30, 32, 34, 35, 39, 41, 42, 43, 44, 53, 56, 58, 59, 60, 62, 63, 65, 70, 72, 73, 75, 76, 77, 79, 80], "210": [22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 36, 37, 40, 41, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81], "maze": [22, 23, 28, 31, 57, 76], "egg": 22, "scatter": [22, 64], "simultan": [22, 23], "kill": [22, 31, 50, 55], "flamethrow": 22, "tricki": 22, "situat": [22, 109], "occasion": [22, 26], "power": [22, 50, 84, 85, 90, 98, 99, 104], "pulsar": 22, "temporari": 22, "abil": 22, "score": [22, 23, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 50, 51, 52, 53, 54, 55, 61, 62, 63, 64, 65, 66, 67, 69, 73, 74, 75, 79, 83, 85], "prize": [22, 77], "caught": [22, 28], "lose": [22, 25, 27, 36, 39, 40, 43, 50, 52, 61, 62, 64, 66, 67, 69, 70, 71, 85, 106, 111], "consult": [22, 51, 52, 53, 54, 55], "pac": 23, "man": 23, "visit": [23, 43, 84], "grid": [23, 109, 111, 112], "chicken": [23, 35, 46], "catch": [23, 39, 45, 67], "travers": 23, "vehicl": [24, 29, 44, 53, 104], "big": [24, 45, 112], "mother": [24, 54, 63], "circl": [24, 112], "overhead": [24, 85], "deploi": 24, "drone": 24, "dodg": [24, 30, 69], "attack": [24, 26, 27, 30, 38, 40, 63], "horizont": [25, 35, 83, 85, 87, 112], "vertic": [25, 83, 98, 99, 104, 112], "lyre": 25, "guid": [25, 46, 104], "award": [25, 31, 36, 39, 43, 69, 98, 99], "field": [26, 104], "appear": [26, 28, 31, 68, 89, 90], "satellit": 26, "ufo": 26, "job": [27, 112], "submerg": 27, "citi": [27, 28, 64, 104], "slowli": 27, "descend": 27, "toward": [27, 51, 102], "strike": [27, 32], "distanc": [27, 44, 94, 112], "defens": [27, 42], "manag": [27, 32], "seven": 27, "fought": 27, "wave": [27, 37, 41, 53, 60, 73], "outer": [27, 87], "robber": 28, "natur": [28, 106, 108, 111], "rob": 28, "getawai": 28, "polic": 28, "chase": [28, 31], "dynamit": [28, 50], "ga": [28, 84], "tank": [28, 29, 69], "nine": [28, 93], "leav": [28, 88, 92, 98, 112], "person": [29, 87, 104], "perspect": [29, 104], "3d": [29, 93, 96, 97, 104, 111], "illus": 29, "radar": [29, 80], "travel": 30, "constant": [30, 69, 85, 90, 93, 95, 96, 103], "steer": [30, 77, 84], "debri": 30, "leftifir": 30, "evil": [31, 56, 81], "touch": [31, 64, 112], "wall": [31, 34, 50, 89, 90], "undefeat": 31, "otto": 31, "tri": 32, "knock": [32, 33], "pin": 32, "spar": 32, "spare": 32, "300": [32, 44, 83, 112], "oppon": [33, 45, 51, 62, 77], "ring": 33, "hit": [33, 34, 35, 36, 41, 63, 64, 67, 68, 70, 106, 111], "punch": [33, 54], "famou": 34, "paddl": [34, 62], "ball": [34, 51, 62, 79], "brick": 34, "wreak": 34, "havoc": 34, "five": [34, 64, 70, 86], "214": 35, "em": 35, "gun": [35, 43], "suppli": [35, 59, 113], "ammunit": 35, "steal": [35, 45], "bullet": [35, 104], "subtract": 35, "minu": 35, "sign": [35, 98, 99], "elf": 36, "magic": 36, "wand": 36, "fend": 36, "spider": 36, "flea": 36, "mushroom": 36, "forest": 36, "bitten": 36, "tempor": 36, "paralyz": 36, "scorpion": 36, "round": 36, "helicopt": [37, 39, 66], "truck": [37, 67], "convoi": 37, "aircraft": [37, 75], "mini": 37, "bottom": [37, 52, 84, 89, 90, 95, 103, 107], "plane": 37, "surviv": [37, 41], "bank": [38, 66], "heist": 38, "battl": 38, "zone": 38, "beam": [38, 50], "rider": 38, "chopper": 38, "command": [38, 92], "crazi": 38, "climber": 38, "demon": 38, "doubl": [38, 92], "dunk": 38, "elev": 38, "fish": 38, "derbi": 38, "ic": [38, 41, 47, 51], "hockei": [38, 51], "journei": [38, 53, 111], "kung": 38, "fu": 38, "master": [38, 107], "montezuma": 38, "reveng": 38, "pacman": 38, "privat": [38, 64, 112], "ey": [38, 59, 64, 104], "road": [38, 84], "runner": 38, "invad": [38, 72], "star": 38, "gunner": 38, "pilot": [38, 60, 81], "pinbal": 38, "wizard": [38, 56], "Of": 38, "wor": 38, "yar": 38, "builid": 39, "obstacl": [39, 53, 54], "fall": [39, 41, 61, 67, 83, 96, 108, 113], "damag": [39, 68], "climb": [39, 54, 86, 104], "fast": [39, 84, 92, 94, 96, 98, 102, 104], "least": [39, 74, 85], "row": [39, 72, 107, 108], "earth": [40, 72], "rescu": [40, 50, 54, 55, 56, 69, 71], "smart": 40, "shot": [40, 42, 43, 51, 52, 67, 104], "abduct": 40, "unlimit": 40, "laser": [40, 50, 72, 80], "missil": [40, 66], "aliv": [40, 96, 103], "face": [41, 93, 96, 97, 106, 111], "planet": [41, 49, 71], "krybor": 41, "accumul": 41, "reserv": [41, 66, 68, 69], "bunker": [41, 49], "increas": [41, 69, 85, 87, 88, 95, 102, 103, 111], "grant": [41, 85], "slai": 41, "2v2": 42, "basketbal": 42, "possess": 42, "rival": 42, "team": 42, "rule": [42, 74, 104, 106, 111], "foul": 42, "success": [42, 87, 109, 113], "secret": [43, 64], "ground": [43, 63, 83, 85, 93, 97, 104], "stair": 43, "equip": 43, "against": [43, 62, 74, 104], "floor": 43, "gather": [43, 64, 112], "apart": [43, 112], "mark": 43, "red": [43, 49, 112], "door": 43, "unreleas": 43, "prototyp": 43, "500": [43, 66, 87, 88, 109, 111], "racer": 44, "nation": 44, "long": [44, 79, 88, 98, 99], "endur": 44, "race": [44, 67, 70, 82], "overtak": 44, "dai": [44, 82], "stai": 44, "meet": 44, "quota": 44, "sunfish": 45, "But": [45, 70], "fisherman": 45, "black": [45, 55, 87, 111], "shark": [45, 59, 69], "lurk": [45, 65], "surfac": [45, 69, 98, 99, 112], "lane": [46, 104], "busi": 46, "rush": 46, "hour": 46, "traffic": 46, "cross": [46, 108], "bailei": 47, "who": [47, 48, 53, 54, 70], "hop": [47, 65, 95, 103], "forth": 47, "arctic": 47, "river": [47, 66], "block": [47, 104], "white": 47, "blue": [47, 49, 74, 87, 112], "he": [47, 49], "hi": [47, 49, 64], "igloo": 47, "shovel": 48, "wield": 48, "farmer": 48, "crop": 48, "carrot": 48, "spacecraft": 49, "fiction": 49, "solar": 49, "landscap": 49, "miner": 50, "mine": [50, 67], "shaft": 50, "tool": [50, 57], "propel": 50, "backpack": 50, "wherev": 50, "blast": [50, 69, 71], "vermin": 50, "raft": 50, "stretch": 50, "critter": 50, "remain": [50, 53, 54, 69, 93, 107, 112, 113], "standard": [51, 93, 94, 98, 104], "minut": [51, 61], "period": [51, 95, 103], "puck": 51, "angl": [51, 52, 83, 85, 87, 88, 91, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103], "extrem": [51, 104, 105], "aim": [51, 95, 98, 102, 103], "rink": 51, "realli": [51, 111], "mr": 52, "bond": 52, "design": [52, 87, 93, 96, 97, 105, 109, 112], "multipurpos": 52, "craft": [52, 85], "varieti": [52, 104], "motion": [52, 104], "slightli": [52, 83, 93], "jump": [52, 67, 70], "dive": 52, "lob": 52, "rate": [52, 69, 111], "highest": [52, 104], "novic": 52, "006": 52, "007": 52, "lead": 53, "peski": 53, "backstag": 53, "scarab": 53, "000": [53, 66, 69], "concert": 53, "cash": 53, "grasp": 53, "groupi": 53, "photograph": 53, "promot": 53, "encount": [53, 54, 75, 104], "her": [54, 63], "preciou": 54, "babi": 54, "ladder": [54, 83], "bonu": [54, 68, 69, 73, 103], "fruit": 54, "monkei": 54, "corner": 54, "beast": 55, "fortress": [55, 57], "princess": [55, 56], "lyssa": 55, "sunris": 55, "monster": [55, 78], "templ": 56, "victoria": 56, "defeat": [56, 65], "acquir": [57, 92], "treasur": [57, 59, 61, 76, 78], "chamber": [57, 78], "emperor": 57, "deadli": 57, "creatur": [57, 65, 73, 104], "valuabl": 57, "pellet": 58, "ghost": 58, "discov": 59, "octopu": 59, "oxygen": [59, 69], "elimin": [60, 76, 77, 78], "war": 60, "bird": 60, "harri": 61, "jungl": 61, "die": [61, 63, 84], "misfortun": 61, "hole": [61, 108], "compet": 62, "deflect": 62, "pig": 63, "piglet": 63, "wolv": 63, "rope": 63, "balloon": 63, "guard": 63, "eat": [63, 67], "bait": 63, "wolf": 63, "stone": 63, "rock": [63, 67], "french": 64, "pierr": 64, "street": 64, "park": 64, "passag": 64, "dead": 64, "search": [64, 104], "ringlead": 64, "henri": 64, "le": 64, "fiend": 64, "gang": 64, "evid": 64, "stolen": 64, "good": [64, 111], "statut": 64, "expir": 64, "nab": 64, "question": [64, 104], "auto": 64, "pothol": 64, "bert": 65, "cube": 65, "pyramid": 65, "destin": [65, 109], "nasti": 65, "jet": 66, "fli": 66, "fuel": [66, 71, 85], "depot": 66, "collid": [66, 69, 85], "squadron": [66, 68], "tanker": 66, "80": 66, "tm": 67, "direct": [67, 69, 87, 88, 89, 90, 93, 95, 96, 98, 99, 103, 108, 112], "outrun": 67, "wile": 67, "coyot": 67, "hazard": 67, "desert": 67, "rocket": [67, 68, 85], "cannon": [67, 72], "cliff": [67, 105], "steel": 67, "pile": 67, "birdse": 67, "cannonbal": 67, "activ": [68, 112], "scrambl": 68, "static": 68, "interfer": 68, "becom": [68, 82, 113], "sensor": [68, 84], "report": [68, 83, 93, 96, 97], "flash": 68, "panel": 68, "earn": 68, "twelv": 68, "abl": [69, 113], "torpedo": 69, "diver": 69, "killer": 69, "deliv": [69, 109], "six": [69, 103], "explod": 69, "anyth": 69, "decreas": [69, 85], "almost": 69, "yoursub": 69, "blow": 69, "forc": [69, 71, 85, 88, 89, 90, 93, 96, 97, 98, 99], "less": [69, 83, 85, 98, 102], "worth": [69, 72], "90": [69, 111], "moment": 69, "skier": 70, "gate": [70, 104], "fastest": 70, "tree": 70, "slalom": 70, "penalti": 70, "warp": 71, "sector": 71, "feder": 71, "zylon": 71, "refuel": 71, "cadet": 71, "corridor": 71, "mania": [73, 75], "orang": 74, "win": [74, 106, 111], "margin": 74, "ti": 74, "sport": 74, "till": [74, 111], "technologi": 75, "increasingli": 75, "futur": 75, "difficult": [75, 88, 92, 98, 99], "rack": 76, "tomb": 76, "guardian": 76, "baja": 77, "bugger": 77, "dungeon": 78, "beat": [80, 106], "scanner": 80, "armi": 81, "enslav": 81, "galaxi": 81, "fighter": 81, "lunar": 82, "lander": 82, "toi": [82, 106, 107, 108, 109], "contribut": 82, "earli": [82, 104, 111], "oleg": [82, 83, 84, 85], "klimov": [82, 83, 84, 85], "popular": [82, 104, 111], "benchmark": [82, 104], "ever": 82, "joint": [83, 85, 87, 88, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103], "uneven": 83, "terrain": [83, 104], "hardcor": 83, "stump": 83, "1600": 83, "heurist": [83, 85], "demonstr": 83, "motor": [83, 102], "hip": [83, 93, 96, 97], "knee": [83, 96, 97], "hull": 83, "angular": [83, 85, 87, 88, 91, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103], "leg": [83, 85, 93, 95, 96, 97, 103, 104], "contact": [83, 85, 92, 93, 96, 97, 98], "lidar": [83, 104], "rangefind": 83, "measur": [83, 91, 93, 94, 95, 96, 97, 98, 100, 101, 102, 103], "far": [83, 84, 98, 100, 101, 104], "torqu": [83, 87, 91, 93, 94, 95, 96, 97, 100, 101, 102, 103], "cost": [83, 94, 95, 102, 103, 104], "better": 83, "stand": [83, 92, 93, 96, 97, 98, 99, 111], "slight": 83, "exce": [83, 106], "closest": 83, "trace": 83, "furthest": 83, "faster": [83, 85, 97], "spent": [83, 85], "higher": 83, "friction": [83, 102, 104], "nervous": 83, "easiest": 84, "ab": [84, 104], "wheel": 84, "gyroscop": 84, "car_rac": 84, "rear": 84, "drive": [84, 109], "acceler": [84, 89, 90, 91], "noth": [84, 85], "brake": 84, "96x96": 84, "tile": 84, "732": 84, "926": 84, "rest": [84, 85, 95, 103], "playfield": 84, "lap_complete_perc": 84, "dictat": [84, 85], "percentag": [84, 111], "lap": 84, "domain_random": 84, "variant": [84, 112], "scenario": [84, 104], "background": 84, "demand": 84, "correspondingli": 84, "init": [84, 112], "scheme": [84, 104], "chri": 84, "campbel": 84, "2014": 84, "www": 84, "iforce2d": 84, "net": [84, 106], "b2dtut": 84, "pontryagin": 85, "principl": 85, "engin": [85, 92], "throttl": 85, "why": 85, "pad": 85, "infinit": [85, 95, 103, 106, 111, 113], "lunar_land": 85, "orient": [85, 93, 96, 97], "sum": [85, 93, 94, 95, 96, 97, 100, 101, 102, 103, 106, 111], "closer": [85, 106], "slower": 85, "tilt": 85, "03": 85, "solut": [85, 111], "viewport": 85, "mass": [85, 93, 94, 96, 97, 102, 104], "bodi": [85, 92, 93, 94, 95, 96, 97, 98, 99, 102, 103], "moon": 85, "greater": [85, 87, 88, 89, 90, 94, 99, 100, 102, 106, 111], "awak": 85, "group": 85, "come": [85, 93, 94, 95, 96, 97, 98, 99, 102, 103], "sleep": 85, "littl": [85, 97], "cpu": 85, "wake": 85, "attach": [85, 88, 91, 93, 103], "graviti": [85, 88, 89, 91, 98, 99, 104], "enable_wind": 85, "wind_pow": 85, "turbulence_pow": 85, "later": [85, 111], "booster": 85, "gravit": 85, "wind": 85, "tanh": 85, "sin": [85, 91, 98], "pi": [85, 87, 91], "9999": 85, "rotat": [85, 87, 93, 96, 97, 100, 111], "turbul": 85, "renorm": 85, "harder": 85, "push": [85, 88, 98, 99, 104], "cart": [86, 98, 99], "nois": [86, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103], "regard": 86, "underpow": 86, "effort": 86, "easier": 86, "ones": [86, 92, 111], "57": 87, "spars": [87, 112], "coars": 87, "barto": [87, 88, 98, 99, 106, 107, 111], "book": [87, 106, 111], "link": [87, 93, 94, 95, 96, 97, 101, 102], "linearli": [87, 98, 99], "actuat": [87, 88, 96, 97], "swing": [87, 91], "free": [87, 91, 92, 93, 96, 97, 98, 99, 104, 111], "height": [87, 95, 98, 103], "hang": 87, "downward": 87, "seen": [87, 94, 104], "green": 87, "cosin": [87, 98, 101], "theta1": 87, "sine": [87, 98, 101], "theta2": 87, "567": 87, "274": 87, "4\u03c0": 87, "9\u03c0": 87, "rad": [87, 88, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103], "incur": [87, 107], "co": [87, 89, 90, 91, 98, 101, 104], "book_or_nip": 87, "neurip": [87, 104], "paper": [87, 98, 104], "nip": [87, 104], "equat": [87, 91], "confirm": 87, "experiment": 87, "radian": [87, 88, 91, 99], "1996": 87, "touretzki": 87, "mozer": 87, "hasselmo": 87, "ed": [87, 109], "vol": 87, "mit": [87, 111], "proceed": 87, "cc": 87, "1995": 87, "8f1d43620bc6bb580df6e80b0dc05c48": 87, "pdf": 87, "anderson": [88, 98, 99], "neuronlik": [88, 98, 99], "adapt": [88, 98, 99, 107], "That": 88, "un": 88, "frictionless": 88, "balanc": [88, 98, 99], "vari": [88, 98, 99, 104], "418": 88, "untermin": 88, "2095": 88, "allot": 88, "475": 88, "05": [88, 93, 94, 100], "07": [89, 90], "sinusoid": [89, 90], "vallei": [89, 90], "strateg": [89, 90], "hill": [89, 90], "andrew": [89, 90], "moor": [89, 90], "phd": [89, 90, 102], "thesi": [89, 90, 102], "1990": [89, 90], "techreport": [89, 90], "moore90efficientmemori": [89, 90], "author": [89, 90, 111], "william": [89, 90], "institut": [89, 90], "univers": [89, 90], "cambridg": [89, 90], "year": [89, 90], "001": [89, 91, 95, 98, 103, 111], "0025": [89, 90], "collis": [89, 90], "inelast": [89, 90], "upon": [89, 90], "quickli": [89, 111], "penalis": [89, 90, 93, 94, 95, 96, 97, 98, 100, 101, 102, 103], "equal": [89, 90, 98, 106, 108], "0015": 90, "45": [90, 97, 100], "999": 90, "invert": [91, 92], "swingup": 91, "diagram": 91, "meter": 91, "theta": 91, "tau": 91, "counter": 91, "clockwis": 91, "theta_dt": 91, "heta": 91, "2736044": 91, "calcul": [91, 92, 93, 96, 97, 98, 100, 101, 108], "math": 91, "half": 92, "cheetah": 92, "standup": 92, "facilit": [92, 104], "develop": 92, "biomechan": 92, "graphic": [92, 104], "anim": 92, "area": 92, "accur": [92, 104], "octob": 92, "2021": [92, 104], "deepmind": [92, 104], "2022": 92, "everyon": 92, "instruct": [92, 112], "websit": [92, 104], "framework": 92, "ten": [92, 106, 111], "iverteddoublependulum": 92, "gaussian": 92, "mjsim": 92, "qpo": 92, "qvel": [92, 96, 97], "indirectli": 92, "xml": [92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103], "tweak": [92, 102], "schulman": 93, "moritz": 93, "levin": 93, "jordan": 93, "abbeel": 93, "advantag": [93, 104, 112], "estim": [93, 113], "torso": [93, 94, 95, 96, 97, 103], "eight": 93, "hing": [93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103], "rotor": [93, 94, 95, 96, 97, 102, 103], "front": [93, 94, 102, 104], "hip_1": [93, 96, 97], "front_left_leg": [93, 96, 97], "angle_1": [93, 96, 97], "hip_2": [93, 96, 97], "front_right_leg": [93, 96, 97], "angle_2": 93, "hip_3": 93, "back_leg": 93, "angle_3": 93, "hip_4": 93, "right_back_leg": 93, "angle_4": 93, "deriv": [93, 94, 95, 96, 97, 98, 99, 102, 103], "exclude_current_positions_from_observ": [93, 94, 95, 96, 102, 103], "113": 93, "regardless": [93, 94, 95, 96, 102, 103], "x_posit": [93, 94, 95, 96, 102, 103], "y_posit": [93, 96, 102], "111": 93, "centr": [93, 96, 97], "ankle_1": 93, "ankle_2": 93, "ankle_3": 93, "ankle_4": 93, "19": [93, 96, 97, 100], "23": [93, 96, 97, 100, 104], "translat": [93, 96, 97, 112], "dof": [93, 96, 97], "quaternion": [93, 96, 97], "healthy_reward": [93, 95, 96, 103], "healthi": [93, 95, 96, 103], "forward_reward": [93, 94, 95, 96, 102, 103], "dt": [93, 94, 95, 96, 100, 101, 102, 103], "frametim": [93, 94, 95, 96, 102, 103], "ctrl_cost": [93, 94, 95, 96, 102, 103], "too": [93, 94, 95, 96, 97, 98, 100, 101, 102, 103], "ctrl_cost_weight": [93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103], "ctr_cost_weight": 93, "contact_cost": [93, 96], "contact_cost_weight": [93, 96], "contact_force_rang": 93, "reset_noise_scal": [93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103], "deviat": [93, 94, 98, 102], "intention": [93, 96, 97], "therebi": [93, 96, 97], "said": [93, 95, 96, 103], "unhealthi": [93, 95, 96, 103], "healthy_z_rang": [93, 95, 96, 103], "terminate_when_unhealthi": [93, 95, 96, 103], "xml_file": [93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103], "path": [93, 94, 95, 96, 100, 101, 102, 103], "model": [93, 94, 95, 96, 102, 103, 104, 111], "5e": [93, 95, 96, 103], "perturb": [93, 94, 95, 96, 102, 103], "exclud": [93, 94, 95, 96, 102, 103], "induct": [93, 94, 95, 96, 102, 103], "bia": [93, 94, 95, 96, 102, 103], "induc": [93, 94, 95, 96, 102, 103], "agnost": [93, 94, 95, 96, 97, 102, 103], "bind": [93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103], "camera": [93, 94, 95, 96, 97, 98, 99, 102, 103, 104], "mujoco_pi": [93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103], "max_time_step": [93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103], "wawrzy\u0144ski": 94, "cat": 94, "paw": 94, "alloc": 94, "thigh": [94, 95, 96, 97, 103], "shin": [94, 96, 97], "feet": [94, 103], "bthigh": 94, "bshin": 94, "bfoot": 94, "fthigh": 94, "fshin": 94, "ffoot": 94, "tip": [94, 98, 102], "rootz": [94, 95, 103], "slide": [94, 95, 98, 99, 100, 101, 102, 103], "rooti": [94, 95, 103], "rootx": [94, 95, 103], "forward_reward_weight": [94, 95, 96, 102, 103], "half_cheetah": 94, "erez": [95, 96, 97, 103], "tassa": [95, 96, 97, 103], "todorov": [95, 96, 97, 103], "predict": [95, 103], "nonlinear": [95, 103], "compar": [95, 102, 103, 111], "figur": [95, 103, 111], "middl": [95, 103], "thigh_joint": [95, 103], "leg_joint": [95, 103], "foot_joint": [95, 103], "002": [95, 103], "008": [95, 103], "els": [95, 103, 108, 111, 112], "healthy_state_rang": 95, "fallen": 95, "healthy_angle_rang": [95, 103], "376": [96, 97], "synthesi": [96, 97, 104], "onlin": [96, 97, 104], "abdomen": [96, 97], "pair": [96, 97], "arm": [96, 97, 100, 101, 104], "elbow": [96, 97, 100], "walk": [96, 103, 105, 108, 112], "right_hip_x": [96, 97], "right_thigh": [96, 97], "right_hip_z": [96, 97], "right_hip_i": [96, 97], "right_kne": [96, 97], "left_hip_x": [96, 97], "left_thigh": [96, 97], "left_hip_z": [96, 97], "left_hip_i": [96, 97], "left_kne": [96, 97], "right_shoulder1": [96, 97], "right_shoulder2": [96, 97], "right_elbow": [96, 97], "left_shoulder1": [96, 97], "left_shoulder2": [96, 97], "left_elbow": [96, 97], "378": 96, "root": [96, 97], "lower_waist": [96, 97], "abdomen_z": [96, 97], "abdomen_i": [96, 97], "pelvi": [96, 97], "abdomen_x": [96, 97], "right_upper_arm": [96, 97], "right_lower_arm": [96, 97], "left_upper_arm": [96, 97], "left_lower_arm": [96, 97], "anglular": [96, 97, 99], "29": [96, 97], "aanglular": [96, 97], "33": [96, 97], "34": 96, "35": [96, 97], "37": [96, 97], "39": [96, 97], "41": [96, 97], "43": [96, 97], "velocitti": 96, "addition": [96, 97], "cinert": [96, 97], "inertia": [96, 97], "rigid": [96, 97], "intermedi": [96, 97], "nbodi": [96, 97], "henc": [96, 97, 105], "140": [96, 97], "cvel": [96, 97], "qfrc_actuat": [96, 97], "constraint": [96, 97, 98, 104], "nv": [96, 97], "cfrc_ext": [96, 97], "dim": [96, 97], "003": 96, "015": 96, "nu": [96, 97], "contact_cost_rang": 96, "lai": 97, "state_spac": 97, "uph_cost": 97, "upward": 97, "absolut": [97, 99, 103], "overal": 97, "atom": 97, "movement": [97, 112], "though": 97, "inflat": 97, "quad_ctrl_cost": 97, "quad_impact_cost": 97, "000001": 97, "105": 97, "unlik": [97, 98, 99, 100, 101], "beyond": [97, 98, 99, 100, 101, 103], "slider": [98, 99], "unitless": [98, 101], "hinge2": 98, "realist": [98, 104], "accuraci": [98, 104], "approach": [98, 111, 112], "analyt": 98, "alive_bonu": 98, "distance_penalti": 98, "velocity_penalti": 98, "005": [98, 100, 101], "y_coordin": 98, "196": 98, "perpendicularli": 98, "cylind": 100, "effector": [100, 101], "fingertip": [100, 101], "shoulder": 100, "forearm": 100, "wrist": 100, "pan": 100, "r_shoulder_pan_joint": 100, "lift": 100, "r_shoulder_lift_joint": 100, "r_upper_arm_roll_joint": 100, "flex": 100, "r_elbow_flex_joint": 100, "r_forearm_roll_joint": 100, "r_wrist_flex_joint": 100, "r_wrist_roll_joint": 100, "analogi": 100, "tips_arm": 100, "obj_slidex": 100, "obj_slidei": 100, "goal_slidex": 100, "goal_slidei": 100, "sphere": 100, "reward_near": 100, "unattach": [100, 101], "reward_control": [100, 101], "euclidean": [100, 101], "perman": 100, "323": 100, "rise": 100, "asset": [100, 101], "gymnasmium": 100, "fixtur": 101, "joint0": 101, "joint1": 101, "target_x": 101, "target_i": 101, "position_fingertip": 101, "position_target": 101, "na": [101, 104], "disk": 101, "radiu": 101, "everyth": 101, "02": 101, "r\u00e9mi": 102, "coulom": 102, "applic": [102, 104], "segment": 102, "articul": [102, 104], "suspend": 102, "subject": [102, 104], "fluid": 102, "viscou": 102, "coeffici": 102, "motor1_rot": 102, "motor2_rot": 102, "\u03b8": 102, "free_body_rot": 102, "slider1": 102, "slider2": 102, "04": 102, "swim": 102, "split": 103, "thigh_left_joint": 103, "leg_left_joint": 103, "foot_left_joint": 103, "ctr_cost": 103, "compli": 104, "maintain": [104, 110], "encourag": 104, "interest": 104, "clone": [104, 112], "huge": 104, "3v3": 104, "hundr": 104, "roughli": 104, "tweakabl": 104, "monei": 104, "slime": 104, "volleybal": 104, "motiv": 104, "premad": 104, "minatar": 104, "foss": 104, "interoper": 104, "synthes": 104, "neuro": 104, "architectur": 104, "integr": 104, "twin": 104, "concept": 104, "seamless": 104, "transfer": 104, "hardwar": 104, "world": [104, 109], "firmwar": 104, "neuroflight": 104, "extens": 104, "ro": 104, "thrust": 104, "ascend": 104, "shall": 104, "altitud": 104, "aerodynam": 104, "drag": 104, "light": 104, "poli": 104, "pinocchio": 104, "meshcat": 104, "web": 104, "bitcraz": 104, "crazyfli": 104, "nanoquadrotor": 104, "mar": 104, "ggym": 104, "endeavor": 104, "gap": 104, "deep": [104, 113], "methodologi": 104, "coverag": 104, "laboratori": 104, "internet": 104, "musculoskelet": 104, "opensim": 104, "physiolog": 104, "competit": 104, "2017": 104, "challeng": [104, 111], "quadrotor": 104, "casadi": 104, "symbol": 104, "priori": 104, "miniatur": 104, "racecar": 104, "portabl": 104, "accompani": 104, "ostrich": 104, "studi": 104, "bio": 104, "mechan": 104, "locomot": 104, "soft": 104, "dual": 104, "dexter": 104, "hand": 104, "manipul": 104, "isaac": 104, "omnivers": 104, "virtual": [104, 112], "ego": 104, "cloud": 104, "semant": 104, "cours": 104, "wide": 104, "account": 104, "yield": 104, "voltag": 104, "duti": 104, "cycl": 104, "plan": 104, "emphasi": 104, "percept": 104, "social": 104, "driver": 104, "whose": [104, 106], "uncertain": 104, "propos": 104, "merg": 104, "intersect": 104, "roundabout": 104, "longitudin": 104, "comprehens": 104, "trackmania": 104, "2020": 104, "latent": 104, "torc": 104, "bandit": 104, "server": 104, "advertis": 104, "greedi": [104, 111], "softmax": 104, "ucb1": 104, "strive": 104, "novel": 104, "taobao": 104, "largest": 104, "commerc": 104, "omg": 104, "toolbox": 104, "electron": 104, "minimalist": 104, "wireless": 104, "elastica": 104, "assembli": 104, "slender": 104, "cosserat": 104, "rod": 104, "trade": 104, "great": [104, 111], "focu": 104, "simplic": 104, "brax": 104, "compil": 104, "llvm": 104, "phase": 104, "gcc": 104, "cuda": 104, "hyperparamet": [104, 111], "cheap": 104, "surrog": 104, "evolutionari": 104, "autom": 104, "deduct": 104, "verif": 104, "cell": [104, 107, 112], "metatrad": 104, "techniqu": 104, "hard": 104, "transport": 104, "puzzl": 104, "warehous": 104, "storag": 104, "overfit": 104, "predefin": [104, 112], "mathemat": 104, "dataset": 104, "arxiv": 104, "2107": 104, "07373": 104, "baselin": 104, "expos": 104, "blockqnn": 104, "wise": 104, "nsc": 104, "cifar": 104, "meta": 104, "tag": 104, "answer": 104, "classif": 104, "procedur": 104, "quantum": 104, "circuit": 104, "wire": 104, "qubit": 104, "googl": 104, "quantumai": 104, "cirq": 104, "morl": 104, "theorem": 104, "prover": 104, "vampir": 104, "theoret": 104, "workshop": 104, "f1tenth": 104, "twisti": 104, "evolut": 104, "propuls": 104, "music": 104, "jax": 104, "frozen": 105, "lake": 105, "suitabl": 105, "card": [106, 111], "dealer": [106, 111], "jack": 106, "queen": 106, "king": 106, "ac": [106, 111], "usabl": [106, 111], "deck": [106, 111], "decid": [106, 108], "bust": [106, 111], "reveal": 106, "facedown": 106, "goe": 106, "outcom": 106, "incompleteidea": 106, "2nd": 106, "html": 106, "sab": [106, 111], "48": 107, "106": 107, "With": [107, 111], "inspir": 107, "dennybritz": 107, "blob": 107, "cliff_walk": 107, "board": 107, "4x12": 107, "3x12": 107, "fact": 107, "encod": [107, 109, 112], "slipperi": 108, "dir": 108, "current_row": 108, "nrow": 108, "current_col": 108, "col": 108, "4x4": 108, "desc": 108, "map_nam": 108, "is_slipperi": 108, "sfff": 108, "fhfh": 108, "fffh": 108, "hffg": 108, "generate_random_map": 108, "toy_text": [108, 111], "frozen_lak": 108, "preload": 108, "8x8": 108, "sfffffff": 108, "ffffffff": 108, "fffhffff": 108, "fffffhff": 108, "fhhfffhf": 108, "fhffhfhf": 108, "fffhfffg": 108, "perpendicular": 108, "bug": [108, 109], "maxq": 109, "decomposit": 109, "tom": 109, "dietterich": 109, "reen": 109, "ellow": 109, "lue": 109, "passeng": 109, "south": 109, "north": 109, "east": 109, "west": 109, "pickup": 109, "404": 109, "reachabl": 109, "taxi_row": 109, "taxi_col": 109, "passenger_loc": 109, "decod": 109, "action_mask": 109, "Or": 109, "argmax": [109, 111], "q_valu": [109, 111], "illeg": 109, "cleaner": 109, "disallow": 109, "loc": 109, "passidx": 109, "capabl": 110, "insert": 110, "casino": 111, "infam": 111, "beatabl": 111, "won": 111, "viabl": 111, "strategi": 111, "favorit": 111, "zemann": 111, "__future__": 111, "annot": 111, "defaultdict": 111, "pyplot": 111, "plt": 111, "seaborn": 111, "sn": 111, "patch": 111, "tqdm": 111, "next_stat": 111, "explanatori": 111, "tell": [111, 113], "idea": [111, 113], "slow": 111, "showcas": 111, "respond": 111, "harm": 111, "blackjackag": 111, "learning_r": 111, "initial_epsilon": 111, "epsilon_decai": 111, "final_epsilon": 111, "discount_factor": 111, "95": 111, "arg": 111, "decai": 111, "lr": 111, "training_error": 111, "get_act": 111, "greedili": 111, "exploit": 111, "next_ob": 111, "future_q_valu": 111, "temporal_differ": 111, "decay_epsilon": 111, "readi": 111, "n_episod": 111, "100_000": 111, "start_epsilon": 111, "decent": 111, "converg": 111, "10x": 111, "rolling_length": 111, "fig": 111, "subplot": 111, "ncol": 111, "figsiz": 111, "set_titl": 111, "reward_moving_averag": 111, "convolv": 111, "length_moving_averag": 111, "training_error_moving_averag": 111, "tight_layout": 111, "create_grid": 111, "usable_ac": 111, "state_valu": 111, "action_valu": 111, "player_count": 111, "dealer_count": 111, "meshgrid": 111, "arang": 111, "apply_along_axi": 111, "arr": 111, "dstack": 111, "value_grid": 111, "policy_grid": 111, "create_plot": 111, "figaspect": 111, "suptitl": 111, "fontsiz": 111, "ax1": 111, "add_subplot": 111, "plot_surfac": 111, "rstride": 111, "cstride": 111, "cmap": 111, "viridi": 111, "edgecolor": 111, "xtick": 111, "ytick": 111, "set_xlabel": 111, "set_ylabel": 111, "zaxi": 111, "set_rotate_label": 111, "set_zlabel": 111, "view_init": 111, "220": 111, "ax2": 111, "heatmap": 111, "linewidth": 111, "accent_r": 111, "cbar": 111, "set_xticklabel": 111, "set_yticklabel": 111, "legend": 111, "legend_el": 111, "facecolor": 111, "lightgreen": 111, "label": 111, "grei": 111, "bbox_to_anchor": 111, "fig1": 111, "fig2": 111, "hopefulli": 111, "grip": 111, "mont": 111, "carlo": 111, "fun": 111, "blackjack_tutori": 111, "jupyt": [111, 112, 113], "ipynb": [111, 112, 113], "overview": 112, "git": 112, "venv": 112, "bin": 112, "concern": 112, "readm": 112, "setup": 112, "gym_exampl": 112, "grid_world": 112, "relative_posit": 112, "reacher_weighted_reward": 112, "discrete_act": 112, "clip_reward": 112, "illustr": [112, 113], "simplist": 112, "gridworldenv": 112, "piec": 112, "abstract": 112, "window_s": 112, "512": 112, "_action_to_direct": 112, "assert": 112, "clock": 112, "_get_ob": 112, "mandatori": 112, "_agent_loc": 112, "_target_loc": 112, "manhattan": 112, "_get_info": 112, "oftentim": 112, "worri": 112, "coincid": 112, "earlier": 112, "array_equ": 112, "_render_fram": 112, "trivial": 112, "skeleton": 112, "set_mod": 112, "canva": 112, "pix_square_s": 112, "rect": 112, "gridlin": 112, "width": 112, "visibl": 112, "blit": 112, "get_rect": 112, "pump": 112, "delai": 112, "stabl": 112, "tick": 112, "surfarrai": 112, "pixels3d": 112, "bother": 112, "detect": 112, "put": 112, "registr": 112, "appropri": 112, "entrypoint": 112, "mere": 112, "explicitli": [112, 113], "third": 112, "parti": 112, "codebas": 112, "edit": 112, "setuptool": 112, "install_requir": 112, "local": 112, "perfectli": 112, "fine": 112, "did": 113, "failur": 113, "notabl": 113, "inher": 113, "preserv": 113, "obviou": 113, "forev": 113, "forcibli": 113, "halt": 113, "formal": 113, "q_": 113, "o_t": 113, "a_t": 113, "r_t": 113, "max_a": 113, "o_": 113, "a_": 113, "q_target": 113, "distinct": 113, "frequent": 113, "differenti": 113, "vf_target": 113, "vf_next_stat": 113, "onward": 113, "handling_time_limit": 113}, "objects": {"Space": [[4, 0, 1, "", "dtype"]], "": [[10, 1, 1, "", "action_space"], [10, 1, 1, "", "observation_space"], [10, 1, 1, "", "single_action_space"], [10, 1, 1, "", "single_observation_space"]], "gymnasium": [[12, 2, 1, "", "ActionWrapper"], [2, 2, 1, "", "Env"], [14, 2, 1, "", "ObservationWrapper"], [15, 2, 1, "", "RewardWrapper"], [11, 2, 1, "", "Wrapper"], [3, 3, 1, "", "make"], [3, 3, 1, "", "register"], [3, 3, 1, "", "spec"]], "gymnasium.ActionWrapper.ActionWrapper": [[12, 3, 1, "", "action"]], "gymnasium.Env": [[2, 1, 1, "", "action_space"], [2, 3, 1, "", "close"], [2, 1, 1, "", "metadata"], [2, 0, 1, "", "np_random"], [2, 1, 1, "", "observation_space"], [2, 3, 1, "", "render"], [2, 1, 1, "", "render_mode"], [2, 3, 1, "", "reset"], [2, 1, 1, "", "reward_range"], [2, 1, 1, "", "spec"], [2, 3, 1, "", "step"], [2, 0, 1, "", "unwrapped"]], "gymnasium.ObservationWrapper": [[14, 3, 1, "", "observation"]], "gymnasium.RewardWrapper.RewardWrapper": [[15, 3, 1, "", "reward"]], "gymnasium.Wrapper": [[11, 0, 1, "", "action_space"], [11, 3, 1, "", "close"], [11, 0, 1, "", "metadata"], [11, 0, 1, "", "np_random"], [11, 0, 1, "", "observation_space"], [11, 3, 1, "", "reset"], [11, 0, 1, "", "reward_range"], [11, 0, 1, "", "spec"], [11, 3, 1, "", "step"], [11, 0, 1, "", "unwrapped"]], "gymnasium.spaces": [[6, 2, 1, "", "Box"], [5, 2, 1, "", "Dict"], [6, 2, 1, "", "Discrete"], [5, 2, 1, "", "Graph"], [6, 2, 1, "", "MultiBinary"], [6, 2, 1, "", "MultiDiscrete"], [5, 2, 1, "", "Sequence"], [4, 2, 1, "", "Space"], [6, 2, 1, "", "Text"], [5, 2, 1, "", "Tuple"]], "gymnasium.spaces.Box": [[6, 4, 1, "", "is_bounded"], [6, 4, 1, "", "sample"], [6, 4, 1, "", "seed"]], "gymnasium.spaces.Dict": [[5, 4, 1, "", "sample"], [5, 4, 1, "", "seed"]], "gymnasium.spaces.Discrete": [[6, 4, 1, "", "sample"], [6, 4, 1, "", "seed"]], "gymnasium.spaces.Graph": [[5, 4, 1, "", "sample"], [5, 4, 1, "", "seed"]], "gymnasium.spaces.MultiBinary": [[6, 4, 1, "", "sample"], [6, 4, 1, "", "seed"]], "gymnasium.spaces.MultiDiscrete": [[6, 4, 1, "", "sample"], [6, 4, 1, "", "seed"]], "gymnasium.spaces.Sequence": [[5, 4, 1, "", "sample"], [5, 4, 1, "", "seed"]], "gymnasium.spaces.Text": [[6, 4, 1, "", "sample"], [6, 4, 1, "", "seed"]], "gymnasium.spaces.Tuple": [[5, 4, 1, "", "sample"], [5, 4, 1, "", "seed"]], "gymnasium.spaces.space.Space": [[4, 3, 1, "", "contains"], [4, 3, 1, "", "from_jsonable"], [4, 3, 1, "", "sample"], [4, 3, 1, "", "seed"], [4, 0, 1, "", "shape"], [4, 3, 1, "", "to_jsonable"]], "gymnasium.spaces.utils": [[7, 3, 1, "", "flatdim"], [7, 3, 1, "", "flatten"], [7, 3, 1, "", "flatten_space"], [7, 3, 1, "", "unflatten"]], "gymnasium.utils.env_checker": [[9, 3, 1, "", "check_env"]], "gymnasium.utils.play": [[9, 2, 1, "", "PlayPlot"], [9, 2, 1, "", "PlayableGame"], [9, 3, 1, "", "play"]], "gymnasium.utils.play.PlayPlot": [[9, 4, 1, "", "callback"]], "gymnasium.utils.play.PlayableGame": [[9, 4, 1, "", "process_event"]], "gymnasium.utils.save_video": [[9, 3, 1, "", "capped_cubic_video_schedule"], [9, 3, 1, "", "save_video"]], "gymnasium.utils.seeding": [[9, 3, 1, "", "np_random"]], "gymnasium.utils.step_api_compatibility": [[9, 3, 1, "", "convert_to_done_step_api"], [9, 3, 1, "", "convert_to_terminated_truncated_step_api"], [9, 3, 1, "", "step_api_compatibility"]], "gymnasium.vector": [[10, 2, 1, "", "AsyncVectorEnv"], [10, 2, 1, "", "SyncVectorEnv"], [10, 2, 1, "", "VectorEnv"], [10, 3, 1, "", "make"]], "gymnasium.vector.VectorEnv": [[10, 4, 1, "", "close"], [10, 4, 1, "", "reset"], [10, 4, 1, "", "step"]], "gymnasium.vector.utils": [[8, 3, 1, "", "batch_space"], [8, 3, 1, "", "concatenate"], [8, 3, 1, "", "create_empty_array"], [8, 3, 1, "", "create_shared_memory"], [8, 3, 1, "", "iterate"], [8, 3, 1, "", "read_from_shared_memory"], [8, 3, 1, "", "write_to_shared_memory"]], "gymnasium.wrappers": [[13, 2, 1, "", "AtariPreprocessing"], [13, 2, 1, "", "AutoResetWrapper"], [12, 2, 1, "", "ClipAction"], [13, 2, 1, "", "EnvCompatibility"], [14, 2, 1, "", "FilterObservation"], [14, 2, 1, "", "FlattenObservation"], [14, 2, 1, "", "FrameStack"], [14, 2, 1, "", "GrayScaleObservation"], [13, 2, 1, "", "HumanRendering"], [14, 2, 1, "", "NormalizeObservation"], [15, 2, 1, "", "NormalizeReward"], [13, 2, 1, "", "OrderEnforcing"], [13, 2, 1, "", "PassiveEnvChecker"], [14, 2, 1, "", "PixelObservationWrapper"], [13, 2, 1, "", "RecordEpisodeStatistics"], [13, 2, 1, "", "RecordVideo"], [13, 2, 1, "", "RenderCollection"], [12, 2, 1, "", "RescaleAction"], [14, 2, 1, "", "ResizeObservation"], [13, 2, 1, "", "StepAPICompatibility"], [14, 2, 1, "", "TimeAwareObservation"], [13, 2, 1, "", "TimeLimit"], [14, 2, 1, "", "TransformObservation"], [15, 2, 1, "", "TransformReward"], [13, 2, 1, "", "VectorListInfo"]]}, "objtypes": {"0": "py:property", "1": "py:attribute", "2": "py:class", "3": "py:function", "4": "py:method"}, "objnames": {"0": ["py", "property", "Python property"], "1": ["py", "attribute", "Python attribute"], "2": ["py", "class", "Python class"], "3": ["py", "function", "Python function"], "4": ["py", "method", "Python method"]}, "titleterms": {"404": 0, "page": [0, 1], "Not": 0, "found": 0, "The": 0, "request": 0, "could": 0, "gymnasium": [1, 2, 10, 11, 110, 112], "doc": 1, "instruct": 1, "modifi": [1, 16], "environ": [1, 2, 3, 9, 10, 13, 16, 17, 18, 104, 110, 111, 112], "edit": 1, "an": [1, 111], "ad": 1, "new": [1, 9], "atari": [1, 13, 19, 38], "env": [1, 2, 10, 104, 112], "non": 1, "other": [1, 104], "step": [1, 9, 17, 18], "build": [1, 111], "document": 1, "write": 1, "tutori": 1, "method": [2, 4, 10, 11], "attribut": [2, 4, 10, 11], "addit": 2, "implement": [2, 11], "registri": 3, "make": [3, 10, 112], "regist": [3, 112], "all": 3, "spec": 3, "space": [4, 5, 6, 7, 8, 16, 19, 45, 46, 47, 48, 49, 83, 84, 85, 87, 88, 89, 90, 91, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 106, 108], "fundament": [4, 6], "composit": [4, 5], "util": [4, 7, 8, 9], "vector": [4, 8, 10, 13], "dict": 5, "tupl": 5, "sequenc": 5, "graph": 5, "box": [6, 33], "discret": 6, "multibinari": 6, "multidiscret": 6, "text": [6, 105], "share": 8, "memori": 8, "visual": [9, 111], "save": 9, "render": [9, 13, 18], "video": [9, 13, 79, 104], "old": 9, "api": [9, 17, 110], "compat": [9, 13, 17], "seed": [9, 18], "check": 9, "vectorenv": 10, "async": 10, "sync": 10, "wrapper": [11, 12, 13, 14, 15, 112], "custom": [11, 112], "action": [12, 16, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 83, 84, 85, 87, 88, 89, 90, 91, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 106, 107, 108, 109, 111], "clip": 12, "rescal": 12, "misc": 13, "preprocess": 13, "autoreset": 13, "passiv": 13, "checker": 13, "human": 13, "order": 13, "enforc": 13, "record": 13, "episod": [13, 83, 84, 85, 87, 88, 89, 90, 91, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103], "statist": 13, "collect": [13, 110], "time": [13, 14, 113], "limit": [13, 113], "list": [13, 38], "info": [13, 109], "observ": [14, 16, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 83, 84, 85, 87, 88, 89, 90, 91, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 106, 107, 108, 109, 111], "transform": [14, 15], "filter": 14, "flatten": 14, "framestack": 14, "grai": 14, "scale": 14, "normal": [14, 15], "pixel": 14, "resiz": 14, "awar": 14, "reward": [15, 19, 22, 23, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 83, 84, 85, 87, 88, 89, 90, 91, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 106, 107, 108, 109], "basic": 16, "usag": 16, "initi": [16, 112], "interact": 16, "explain": 16, "code": [16, 18, 113], "more": 16, "inform": 16, "gym": [17, 104], "load": 17, "openai": 17, "v0": 17, "22": 17, "v21": 18, "v26": 18, "migrat": 18, "guid": 18, "exampl": 18, "random": 18, "number": 18, "gener": 18, "reset": [18, 84], "remov": 18, "autorom": 19, "instal": 19, "rom": 19, "stochast": 19, "common": 19, "argument": [19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 83, 84, 85, 87, 88, 89, 90, 91, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 106, 107, 108, 109], "version": [19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 83, 84, 85, 87, 89, 90, 91, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 106, 107, 108, 109], "histori": [19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 83, 84, 85, 87, 89, 90, 91, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 106, 107, 108, 109], "name": [19, 59], "scheme": 19, "flavor": 19, "refer": [19, 84, 87, 110], "adventur": 20, "descript": [20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 83, 84, 85, 87, 88, 89, 90, 91, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 106, 107, 109], "air": 21, "raid": 21, "alien": 22, "amidar": 23, "assault": 24, "asterix": 25, "asteroid": 26, "atlanti": 27, "bank": 28, "heist": 28, "battl": 29, "zone": 29, "beam": 30, "rider": 30, "berzerk": 31, "bowl": 32, "breakout": 34, "carniv": 35, "centiped": 36, "chopper": 37, "command": 37, "complet": 38, "crazi": 39, "climber": 39, "defend": 40, "demon": 41, "attack": 41, "doubl": [42, 98], "dunk": 42, "elev": 43, "enduro": 44, "fishingderbi": 45, "freewai": 46, "frostbit": 47, "gopher": 48, "gravitar": 49, "hero": 50, "icehockei": 51, "jamesbond": 52, "journeyescap": 53, "kangaroo": 54, "krull": 55, "kung": 56, "fu": 56, "master": 56, "montezuma": 57, "reveng": 57, "m": 58, "pacman": 58, "thi": 59, "game": [59, 104], "phoenix": 60, "pitfal": 61, "pong": 62, "pooyan": 63, "privateey": 64, "qbert": 65, "riverraid": 66, "road": 67, "runner": 67, "robot": [68, 104], "tank": 68, "seaquest": 69, "ski": 70, "solari": 71, "spaceinvad": 72, "stargunn": 73, "tenni": 74, "timepilot": 75, "tutankham": 76, "up": 77, "n": 77, "down": 77, "ventur": 78, "pinbal": 79, "wizard": 80, "wor": 80, "zaxxon": 81, "box2d": 82, "biped": 83, "walker": 83, "start": [83, 84, 85, 87, 88, 89, 90, 91, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103], "state": [83, 84, 85, 87, 88, 89, 90, 91, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103], "termin": [83, 84, 85, 113], "credit": [83, 84, 85], "car": [84, 89, 90], "race": [84, 104], "lunar": 85, "lander": 85, "classic": 86, "control": [86, 104], "acrobot": 87, "end": [87, 88, 89, 90, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103], "cart": 88, "pole": 88, "mountain": [89, 90], "transit": [89, 90], "dynam": [89, 90], "continu": 90, "pendulum": [91, 98, 99], "truncat": [91, 113], "mujoco": 92, "ant": 93, "half": 94, "cheetah": 94, "hopper": 95, "humanoid": [96, 97], "standup": 97, "invert": [98, 99], "pusher": 100, "reacher": 101, "swimmer": 102, "note": 102, "walker2d": 103, "third": 104, "parti": 104, "flappi": 104, "bird": 104, "A": 104, "derk": 104, "gpu": 104, "acceler": 104, "moba": 104, "slimevolleygym": 104, "simpl": 104, "singl": 104, "multi": 104, "agent": [104, 111], "reinforc": [104, 110], "learn": [104, 110, 111, 113], "stabl": 104, "retro": 104, "uniti": 104, "ml": 104, "pge": 104, "parallel": 104, "engin": 104, "gymfc": 104, "flight": 104, "tune": 104, "train": [104, 111], "framework": 104, "gazebo": 104, "goddard": 104, "": 104, "rocket": 104, "problem": 104, "jimini": 104, "pybullet": 104, "drone": 104, "marsexplor": 104, "panda": 104, "robo": 104, "offworld": 104, "osim": 104, "rl": 104, "safe": 104, "racecar_gym": 104, "softrobot": 104, "ostrichrl": 104, "quadrup": 104, "evogym": 104, "igibson": 104, "dexteroushand": 104, "omniisaacgymenv": 104, "spacerobotenv": 104, "line": 104, "follow": 104, "autonom": 104, "drive": 104, "traffic": 104, "carla": 104, "duckietown": 104, "electr": 104, "motor": 104, "highwai": 104, "longicontrol": 104, "sumo": 104, "commonroad": 104, "tmrl": 104, "racing_dream": 104, "l2r": 104, "gym_torc": 104, "recommend": 104, "system": 104, "adserv": 104, "recsi": 104, "virtualtaobao": 104, "industri": 104, "process": 104, "inventori": 104, "openmodelica": 104, "microgrid": 104, "mobil": 104, "pyelastica": 104, "financi": 104, "anytrad": 104, "mtsim": 104, "carl": 104, "compilergym": 104, "dacbench": 104, "autokei": 104, "cellular": 104, "automata": 104, "maze": 104, "riverswim": 104, "sokoban": 104, "math": 104, "prog": 104, "synth": 104, "nasgym": 104, "nlpgym": 104, "toolkit": 104, "develop": 104, "solv": [104, 111], "nlp": 104, "task": 104, "obstacl": 104, "tower": 104, "qasgym": 104, "mo": 104, "satur": 104, "shinrl": 104, "rubikscubegym": 104, "design": 104, "tool": 104, "starship": 104, "land": 104, "raveforc": 104, "gymnax": 104, "toi": 105, "blackjack": [106, 111], "cliff": 107, "walk": 107, "frozen": 108, "lake": 108, "taxi": 109, "i": 110, "standard": 110, "divers": 110, "q": 111, "import": [111, 113], "setup": 111, "execut": 111, "visualis": 111, "polici": 111, "think": 111, "you": 111, "can": 111, "do": 111, "better": 111, "your": 112, "own": 112, "subclass": 112, "declar": 112, "creat": 112, "packag": 112, "instanc": 112, "us": 112, "handl": 113, "solut": 113}, "envversion": {"sphinx.domains.c": 2, "sphinx.domains.changeset": 1, "sphinx.domains.citation": 1, "sphinx.domains.cpp": 8, "sphinx.domains.index": 1, "sphinx.domains.javascript": 2, "sphinx.domains.math": 2, "sphinx.domains.python": 3, "sphinx.domains.rst": 2, "sphinx.domains.std": 2, "sphinx": 57}, "alltitles": {"404 - Page Not Found": [[0, "page-not-found"]], "The requested page could not be found.": [[0, "the-requested-page-could-not-be-found"]], "Gymnasium-docs": [[1, "gymnasium-docs"]], "Instructions for modifying environment pages": [[1, "instructions-for-modifying-environment-pages"]], "Editing an environment page": [[1, "editing-an-environment-page"]], "Adding a new environment": [[1, "adding-a-new-environment"]], "Atari env": [[1, "atari-env"]], "Non-Atari env": [[1, "non-atari-env"]], "Other steps": [[1, "other-steps"]], "Build the Documentation": [[1, "build-the-documentation"]], "Writing Tutorials": [[1, "writing-tutorials"]], "Env": [[2, "env"]], "gymnasium.Env": [[2, "gymnasium-env"]], "Methods": [[2, "methods"], [4, "methods"], [10, "methods"], [11, "methods"]], "Attributes": [[2, "attributes"], [4, "attributes"], [10, "attributes"], [11, "attributes"]], "Additional Methods": [[2, "additional-methods"]], "Implementing environments": [[2, "implementing-environments"]], "Registry": [[3, "registry"]], "Make": [[3, "make"]], "Register": [[3, "register"]], "All registered environments": [[3, "all-registered-environments"]], "Spec": [[3, "spec"]], "Spaces": [[4, "spaces"]], "Fundamental Spaces": [[4, "fundamental-spaces"], [6, "fundamental-spaces"]], "Composite Spaces": [[4, "composite-spaces"], [5, "composite-spaces"]], "Utils": [[4, "utils"], [9, "utils"]], "Vector Utils": [[4, "vector-utils"]], "Dict": [[5, "dict"]], "Tuple": [[5, "tuple"]], "Sequence": [[5, "sequence"]], "Graph": [[5, "graph"]], "Box": [[6, "box"]], "Discrete": [[6, "discrete"]], "MultiBinary": [[6, "multibinary"]], "MultiDiscrete": [[6, "multidiscrete"]], "Text": [[6, "text"]], "Spaces Utils": [[7, "spaces-utils"]], "Spaces Vector Utils": [[8, "spaces-vector-utils"]], "Shared Memory Utils": [[8, "shared-memory-utils"]], "Visualization": [[9, "visualization"]], "Save Rendering Videos": [[9, "save-rendering-videos"]], "Old to New Step API Compatibility": [[9, "old-to-new-step-api-compatibility"]], "Seeding": [[9, "seeding"]], "Environment Checking": [[9, "environment-checking"]], "Vector": [[10, "vector"]], "Gymnasium.vector.VectorEnv": [[10, "gymnasium-vector-vectorenv"]], "Making Vector Environments": [[10, "making-vector-environments"]], "Async Vector Env": [[10, "async-vector-env"]], "Sync Vector Env": [[10, "sync-vector-env"]], "Wrappers": [[11, "wrappers"]], "gymnasium.Wrapper": [[11, "gymnasium-wrapper"]], "Gymnasium Wrappers": [[11, "gymnasium-wrappers"]], "Implementing a custom wrapper": [[11, "implementing-a-custom-wrapper"]], "Action Wrappers": [[12, "action-wrappers"]], "Action Wrapper": [[12, "action-wrapper"]], "Clip Action": [[12, "clip-action"]], "Rescale Action": [[12, "rescale-action"]], "Misc Wrappers": [[13, "misc-wrappers"]], "Atari Preprocessing": [[13, "atari-preprocessing"]], "Autoreset": [[13, "autoreset"]], "Compatibility": [[13, "compatibility"]], "Passive Environment Checker": [[13, "passive-environment-checker"]], "Human Rendering": [[13, "human-rendering"]], "Order Enforcing": [[13, "order-enforcing"]], "Record Episode Statistics": [[13, "record-episode-statistics"]], "Record Video": [[13, "record-video"]], "Render Collection": [[13, "render-collection"]], "Time Limit": [[13, "time-limit"]], "Vector List Info": [[13, "vector-list-info"]], "Observation Wrappers": [[14, "observation-wrappers"]], "Observation Wrapper": [[14, "observation-wrapper"]], "Transform Observation": [[14, "transform-observation"]], "Filter Observation": [[14, "filter-observation"]], "Flatten Observation": [[14, "flatten-observation"]], "Framestack Observations": [[14, "framestack-observations"]], "Gray Scale Observation": [[14, "gray-scale-observation"]], "Normalize Observation": [[14, "normalize-observation"]], "Pixel Observation Wrapper": [[14, "pixel-observation-wrapper"]], "Resize Observation": [[14, "resize-observation"]], "Time Aware Observation": [[14, "time-aware-observation"]], "Reward Wrappers": [[15, "reward-wrappers"]], "Reward Wrapper": [[15, "reward-wrapper"]], "Transform Reward": [[15, "transform-reward"]], "Normalize Reward": [[15, "normalize-reward"]], "Basic Usage": [[16, "basic-usage"]], "Initializing Environments": [[16, "initializing-environments"]], "Interacting with the Environment": [[16, "interacting-with-the-environment"]], "Explaining the code": [[16, "explaining-the-code"]], "Action and observation spaces": [[16, "action-and-observation-spaces"]], "Modifying the environment": [[16, "modifying-the-environment"]], "More information": [[16, "more-information"]], "Compatibility with Gym": [[17, "compatibility-with-gym"]], "Loading OpenAI Gym environments": [[17, "loading-openai-gym-environments"]], "Gym v0.22 Environment Compatibility": [[17, "gym-v0-22-environment-compatibility"]], "Step API Compatibility": [[17, "step-api-compatibility"]], "v21 to v26 Migration Guide": [[18, "v21-to-v26-migration-guide"]], "Example code for v21": [[18, "example-code-for-v21"]], "Example code for v26": [[18, "example-code-for-v26"]], "Seed and random number generator": [[18, "seed-and-random-number-generator"]], "Environment Reset": [[18, "environment-reset"]], "Environment Step": [[18, "environment-step"]], "Environment Render": [[18, "environment-render"]], "Removed code": [[18, "removed-code"]], "Atari": [[19, "atari"]], "AutoROM (installing the ROMs)": [[19, "autorom-installing-the-roms"]], "Action Space": [[19, "action-space"], [45, "action-space"], [46, "action-space"], [47, "action-space"], [48, "action-space"], [49, "action-space"], [83, "action-space"], [84, "action-space"], [85, "action-space"], [87, "action-space"], [88, "action-space"], [89, "action-space"], [90, "action-space"], [91, "action-space"], [93, "action-space"], [94, "action-space"], [95, "action-space"], [96, "action-space"], [97, "action-space"], [98, "action-space"], [99, "action-space"], [100, "action-space"], [101, "action-space"], [102, "action-space"], [103, "action-space"], [106, "action-space"], [108, "action-space"]], "Observation Space": [[19, "observation-space"], [83, "observation-space"], [84, "observation-space"], [85, "observation-space"], [87, "observation-space"], [88, "observation-space"], [89, "observation-space"], [90, "observation-space"], [91, "observation-space"], [93, "observation-space"], [94, "observation-space"], [95, "observation-space"], [96, "observation-space"], [97, "observation-space"], [98, "observation-space"], [99, "observation-space"], [100, "observation-space"], [101, "observation-space"], [102, "observation-space"], [103, "observation-space"], [106, "observation-space"], [108, "observation-space"]], "Rewards": [[19, "rewards"], [22, "rewards"], [23, "rewards"], [25, "rewards"], [26, "rewards"], [27, "rewards"], [28, "rewards"], [29, "rewards"], [30, "rewards"], [31, "rewards"], [32, "rewards"], [33, "rewards"], [34, "rewards"], [35, "rewards"], [36, "rewards"], [37, "rewards"], [39, "rewards"], [40, "rewards"], [41, "rewards"], [42, "rewards"], [43, "rewards"], [44, "rewards"], [45, "rewards"], [46, "rewards"], [47, "rewards"], [48, "rewards"], [49, "rewards"], [50, "rewards"], [51, "rewards"], [52, "rewards"], [53, "rewards"], [54, "rewards"], [55, "rewards"], [61, "rewards"], [62, "rewards"], [63, "rewards"], [64, "rewards"], [65, "rewards"], [66, "rewards"], [67, "rewards"], [68, "rewards"], [69, "rewards"], [70, "rewards"], [71, "rewards"], [72, "rewards"], [73, "rewards"], [74, "rewards"], [75, "rewards"], [83, "rewards"], [84, "rewards"], [85, "rewards"], [87, "rewards"], [88, "rewards"], [91, "rewards"], [93, "rewards"], [94, "rewards"], [95, "rewards"], [96, "rewards"], [97, "rewards"], [98, "rewards"], [99, "rewards"], [100, "rewards"], [101, "rewards"], [102, "rewards"], [103, "rewards"], [106, "rewards"], [108, "rewards"], [109, "rewards"]], "Stochasticity": [[19, "stochasticity"]], "Common Arguments": [[19, "common-arguments"]], "Version History and Naming Schemes": [[19, "version-history-and-naming-schemes"]], "Flavors": [[19, "flavors"]], "References": [[19, "references"], [84, "references"], [87, "references"]], "Adventure": [[20, "adventure"]], "Description": [[20, "description"], [21, "description"], [22, "description"], [23, "description"], [24, "description"], [25, "description"], [26, "description"], [27, "description"], [28, "description"], [29, "description"], [30, "description"], [31, "description"], [32, "description"], [33, "description"], [34, "description"], [35, "description"], [36, "description"], [37, "description"], [39, "description"], [40, "description"], [41, "description"], [42, "description"], [43, "description"], [44, "description"], [45, "description"], [46, "description"], [47, "description"], [48, "description"], [49, "description"], [50, "description"], [51, "description"], [52, "description"], [53, "description"], [54, "description"], [55, "description"], [56, "description"], [57, "description"], [58, "description"], [59, "description"], [60, "description"], [61, "description"], [62, "description"], [63, "description"], [64, "description"], [65, "description"], [66, "description"], [67, "description"], [68, "description"], [69, "description"], [70, "description"], [71, "description"], [72, "description"], [73, "description"], [74, "description"], [75, "description"], [76, "description"], [77, "description"], [78, "description"], [79, "description"], [80, "description"], [81, "description"], [83, "description"], [84, "description"], [85, "description"], [87, "description"], [88, "description"], [89, "description"], [90, "description"], [91, "description"], [93, "description"], [94, "description"], [95, "description"], [96, "description"], [97, "description"], [98, "description"], [99, "description"], [100, "description"], [101, "description"], [102, "description"], [103, "description"], [106, "description"], [107, "description"], [109, "description"]], "Actions": [[20, "actions"], [21, "actions"], [22, "actions"], [23, "actions"], [24, "actions"], [25, "actions"], [26, "actions"], [27, "actions"], [28, "actions"], [29, "actions"], [30, "actions"], [31, "actions"], [32, "actions"], [33, "actions"], [34, "actions"], [35, "actions"], [36, "actions"], [37, "actions"], [39, "actions"], [40, "actions"], [41, "actions"], [42, "actions"], [43, "actions"], [44, "actions"], [50, "actions"], [51, "actions"], [52, "actions"], [53, "actions"], [54, "actions"], [55, "actions"], [56, "actions"], [57, "actions"], [58, "actions"], [59, "actions"], [60, "actions"], [61, "actions"], [62, "actions"], [63, "actions"], [64, "actions"], [65, "actions"], [66, "actions"], [67, "actions"], [68, "actions"], [69, "actions"], [70, "actions"], [71, "actions"], [72, "actions"], [73, "actions"], [74, "actions"], [75, "actions"], [76, "actions"], [77, "actions"], [78, "actions"], [79, "actions"], [80, "actions"], [81, "actions"], [107, "actions"], [109, "actions"]], "Observations": [[20, "observations"], [21, "observations"], [22, "observations"], [23, "observations"], [24, "observations"], [25, "observations"], [26, "observations"], [27, "observations"], [28, "observations"], [29, "observations"], [30, "observations"], [31, "observations"], [32, "observations"], [33, "observations"], [34, "observations"], [35, "observations"], [36, "observations"], [37, "observations"], [39, "observations"], [40, "observations"], [41, "observations"], [42, "observations"], [43, "observations"], [44, "observations"], [45, "observations"], [46, "observations"], [47, "observations"], [48, "observations"], [49, "observations"], [50, "observations"], [51, "observations"], [52, "observations"], [53, "observations"], [54, "observations"], [55, "observations"], [56, "observations"], [57, "observations"], [58, "observations"], [59, "observations"], [60, "observations"], [61, "observations"], [62, "observations"], [63, "observations"], [64, "observations"], [65, "observations"], [66, "observations"], [67, "observations"], [68, "observations"], [69, "observations"], [70, "observations"], [71, "observations"], [72, "observations"], [73, "observations"], [74, "observations"], [75, "observations"], [76, "observations"], [77, "observations"], [78, "observations"], [79, "observations"], [80, "observations"], [81, "observations"], [107, "observations"], [109, "observations"]], "Arguments": [[20, "arguments"], [21, "arguments"], [22, "arguments"], [23, "arguments"], [24, "arguments"], [25, "arguments"], [26, "arguments"], [27, "arguments"], [28, "arguments"], [29, "arguments"], [30, "arguments"], [31, "arguments"], [32, "arguments"], [33, "arguments"], [34, "arguments"], [35, "arguments"], [36, "arguments"], [37, "arguments"], [39, "arguments"], [40, "arguments"], [41, "arguments"], [42, "arguments"], [43, "arguments"], [44, "arguments"], [45, "arguments"], [46, "arguments"], [47, "arguments"], [48, "arguments"], [49, "arguments"], [50, "arguments"], [51, "arguments"], [52, "arguments"], [53, "arguments"], [54, "arguments"], [55, "arguments"], [56, "arguments"], [57, "arguments"], [58, "arguments"], [59, "arguments"], [60, "arguments"], [61, "arguments"], [62, "arguments"], [63, "arguments"], [64, "arguments"], [65, "arguments"], [66, "arguments"], [67, "arguments"], [68, "arguments"], [69, "arguments"], [70, "arguments"], [71, "arguments"], [72, "arguments"], [73, "arguments"], [74, "arguments"], [75, "arguments"], [76, "arguments"], [77, "arguments"], [78, "arguments"], [79, "arguments"], [80, "arguments"], [81, "arguments"], [83, "arguments"], [84, "arguments"], [85, "arguments"], [87, "arguments"], [88, "arguments"], [89, "arguments"], [90, "arguments"], [91, "arguments"], [93, "arguments"], [94, "arguments"], [95, "arguments"], [96, "arguments"], [97, "arguments"], [98, "arguments"], [99, "arguments"], [100, "arguments"], [101, "arguments"], [102, "arguments"], [103, "arguments"], [106, "arguments"], [107, "arguments"], [108, "arguments"], [109, "arguments"]], "Version History": [[20, "version-history"], [21, "version-history"], [22, "version-history"], [23, "version-history"], [24, "version-history"], [25, "version-history"], [26, "version-history"], [27, "version-history"], [28, "version-history"], [29, "version-history"], [30, "version-history"], [31, "version-history"], [32, "version-history"], [33, "version-history"], [34, "version-history"], [35, "version-history"], [36, "version-history"], [37, "version-history"], [39, "version-history"], [40, "version-history"], [41, "version-history"], [42, "version-history"], [43, "version-history"], [44, "version-history"], [45, "version-history"], [46, "version-history"], [47, "version-history"], [48, "version-history"], [49, "version-history"], [50, "version-history"], [51, "version-history"], [52, "version-history"], [53, "version-history"], [54, "version-history"], [55, "version-history"], [56, "version-history"], [57, "version-history"], [58, "version-history"], [59, "version-history"], [60, "version-history"], [61, "version-history"], [62, "version-history"], [63, "version-history"], [64, "version-history"], [65, "version-history"], [66, "version-history"], [67, "version-history"], [68, "version-history"], [69, "version-history"], [70, "version-history"], [71, "version-history"], [72, "version-history"], [73, "version-history"], [74, "version-history"], [75, "version-history"], [76, "version-history"], [77, "version-history"], [78, "version-history"], [79, "version-history"], [80, "version-history"], [81, "version-history"], [83, "version-history"], [84, "version-history"], [85, "version-history"], [87, "version-history"], [89, "version-history"], [90, "version-history"], [91, "version-history"], [93, "version-history"], [94, "version-history"], [95, "version-history"], [96, "version-history"], [97, "version-history"], [98, "version-history"], [99, "version-history"], [100, "version-history"], [101, "version-history"], [102, "version-history"], [103, "version-history"], [106, "version-history"], [107, "version-history"], [108, "version-history"], [109, "version-history"]], "Air Raid": [[21, "air-raid"]], "Alien": [[22, "alien"]], "Amidar": [[23, "amidar"]], "Assault": [[24, "assault"]], "Asterix": [[25, "asterix"]], "Asteroids": [[26, "asteroids"]], "Atlantis": [[27, "atlantis"]], "Bank Heist": [[28, "bank-heist"]], "Battle Zone": [[29, "battle-zone"]], "Beam Rider": [[30, "beam-rider"]], "Berzerk": [[31, "berzerk"]], "Bowling": [[32, "bowling"]], "Boxing": [[33, "boxing"]], "Breakout": [[34, "breakout"]], "Carnival": [[35, "carnival"]], "Centipede": [[36, "centipede"]], "Chopper Command": [[37, "chopper-command"]], "Complete List - Atari": [[38, "complete-list-atari"]], "Crazy Climber": [[39, "crazy-climber"]], "Defender": [[40, "defender"]], "Demon Attack": [[41, "demon-attack"]], "Double Dunk": [[42, "double-dunk"]], "Elevator Action": [[43, "elevator-action"]], "Enduro": [[44, "enduro"]], "FishingDerby": [[45, "fishingderby"]], "Freeway": [[46, "freeway"]], "Frostbite": [[47, "frostbite"]], "Gopher": [[48, "gopher"]], "Gravitar": [[49, "gravitar"]], "Hero": [[50, "hero"]], "IceHockey": [[51, "icehockey"]], "Jamesbond": [[52, "jamesbond"]], "JourneyEscape": [[53, "journeyescape"]], "Kangaroo": [[54, "kangaroo"]], "Krull": [[55, "krull"]], "Kung Fu Master": [[56, "kung-fu-master"]], "Montezuma Revenge": [[57, "montezuma-revenge"]], "Ms Pacman": [[58, "ms-pacman"]], "Name This Game": [[59, "name-this-game"]], "Phoenix": [[60, "phoenix"]], "Pitfall": [[61, "pitfall"]], "Pong": [[62, "pong"]], "Pooyan": [[63, "pooyan"]], "PrivateEye": [[64, "privateeye"]], "Qbert": [[65, "qbert"]], "Riverraid": [[66, "riverraid"]], "Road Runner": [[67, "road-runner"]], "Robot Tank": [[68, "robot-tank"]], "Seaquest": [[69, "seaquest"]], "Skiings": [[70, "skiings"]], "Solaris": [[71, "solaris"]], "SpaceInvaders": [[72, "spaceinvaders"]], "StarGunner": [[73, "stargunner"]], "Tennis": [[74, "tennis"]], "TimePilot": [[75, "timepilot"]], "Tutankham": [[76, "tutankham"]], "Up n\u2019 Down": [[77, "up-n-down"]], "Venture": [[78, "venture"]], "Video Pinball": [[79, "video-pinball"]], "Wizard of Wor": [[80, "wizard-of-wor"]], "Zaxxon": [[81, "zaxxon"]], "Box2D": [[82, "box2d"]], "Bipedal Walker": [[83, "bipedal-walker"]], "Starting State": [[83, "starting-state"], [84, "starting-state"], [85, "starting-state"], [87, "starting-state"], [88, "starting-state"], [89, "starting-state"], [90, "starting-state"], [91, "starting-state"], [93, "starting-state"], [94, "starting-state"], [95, "starting-state"], [96, "starting-state"], [97, "starting-state"], [98, "starting-state"], [99, "starting-state"], [100, "starting-state"], [101, "starting-state"], [102, "starting-state"], [103, "starting-state"]], "Episode Termination": [[83, "episode-termination"], [84, "episode-termination"], [85, "episode-termination"]], "Credits": [[83, "credits"], [84, "credits"], [85, "credits"]], "Car Racing": [[84, "car-racing"]], "Reset Arguments": [[84, "reset-arguments"]], "Lunar Lander": [[85, "lunar-lander"]], "Classic Control": [[86, "classic-control"]], "Acrobot": [[87, "acrobot"]], "Episode End": [[87, "episode-end"], [88, "episode-end"], [89, "episode-end"], [90, "episode-end"], [93, "episode-end"], [94, "episode-end"], [95, "episode-end"], [96, "episode-end"], [97, "episode-end"], [98, "episode-end"], [99, "episode-end"], [100, "episode-end"], [101, "episode-end"], [102, "episode-end"], [103, "episode-end"]], "Cart Pole": [[88, "cart-pole"]], "Mountain Car": [[89, "mountain-car"]], "Transition Dynamics:": [[89, "transition-dynamics"], [90, "transition-dynamics"]], "Reward:": [[89, "reward"]], "Mountain Car Continuous": [[90, "mountain-car-continuous"]], "Reward": [[90, "reward"], [107, "reward"]], "Pendulum": [[91, "pendulum"]], "Episode Truncation": [[91, "episode-truncation"]], "MuJoCo": [[92, "mujoco"]], "Ant": [[93, "ant"]], "Half Cheetah": [[94, "half-cheetah"]], "Hopper": [[95, "hopper"]], "Humanoid": [[96, "humanoid"]], "Humanoid Standup": [[97, "humanoid-standup"]], "Inverted Double Pendulum": [[98, "inverted-double-pendulum"]], "Inverted Pendulum": [[99, "inverted-pendulum"]], "Pusher": [[100, "pusher"]], "Reacher": [[101, "reacher"]], "Swimmer": [[102, "swimmer"]], "Notes": [[102, "notes"]], "Walker2D": [[103, "walker2d"]], "Third-Party Environments": [[104, "third-party-environments"]], "Video Game Environments": [[104, "video-game-environments"]], " flappy-bird-gym: A Flappy Bird environment for Gym": [[104, "flappy-bird-gym-a-flappy-bird-environment-for-gym"]], " gym-derk: GPU accelerated MOBA environment": [[104, "gym-derk-gpu-accelerated-moba-environment"]], " SlimeVolleyGym: A simple environment for single and multi-agent reinforcement learning": [[104, "slimevolleygym-a-simple-environment-for-single-and-multi-agent-reinforcement-learning"]], " stable-retro": [[104, "stable-retro"]], " Unity ML Agents": [[104, "unity-ml-agents"]], " gym-games": [[104, "gym-games"]], " PGE: Parallel Game Engine": [[104, "pge-parallel-game-engine"]], "Robotics Environments": [[104, "robotics-environments"]], "GymFC: A flight control tuning and training framework": [[104, "gymfc-a-flight-control-tuning-and-training-framework"]], "gym-gazebo": [[104, "gym-gazebo"]], "gym-goddard: Goddard\u2019s Rocket Problem": [[104, "gym-goddard-goddard-s-rocket-problem"]], "gym-jiminy: training Robots in Jiminy": [[104, "gym-jiminy-training-robots-in-jiminy"]], "gym-pybullet-drones": [[104, "gym-pybullet-drones"]], "MarsExplorer": [[104, "marsexplorer"]], "panda-gym ": [[104, "panda-gym"]], "robo-gym": [[104, "robo-gym"]], "Offworld-gym": [[104, "offworld-gym"]], "osim-rl": [[104, "osim-rl"]], "safe-control-gym": [[104, "safe-control-gym"]], "racecar_gym": [[104, "racecar-gym"]], "jiminy": [[104, "jiminy"]], "gym-softrobot": [[104, "gym-softrobot"]], "ostrichrl": [[104, "ostrichrl"]], "quadruped-gym": [[104, "quadruped-gym"]], "evogym": [[104, "evogym"]], "iGibson": [[104, "igibson"]], "DexterousHands": [[104, "dexteroushands"]], "OmniIsaacGymEnvs": [[104, "omniisaacgymenvs"]], "SpaceRobotEnv": [[104, "spacerobotenv"]], "gym-line-follower": [[104, "gym-line-follower"]], "Autonomous Driving and Traffic Control Environments": [[104, "autonomous-driving-and-traffic-control-environments"]], " gym-carla": [[104, "gym-carla"]], " gym-duckietown": [[104, "gym-duckietown"]], " gym-electric-motor": [[104, "gym-electric-motor"]], " highway-env": [[104, "highway-env"]], " LongiControl": [[104, "longicontrol"]], " sumo-rl": [[104, "sumo-rl"]], " CommonRoad-RL": [[104, "commonroad-rl"]], "tmrl": [[104, "tmrl"]], "racing_dreamer": [[104, "racing-dreamer"]], "l2r": [[104, "l2r"]], "gym_torcs": [[104, "gym-torcs"]], "Recommendation System Environments": [[104, "recommendation-system-environments"]], " gym-adserve": [[104, "gym-adserve"]], " gym-recsys": [[104, "gym-recsys"]], " VirtualTaobao": [[104, "virtualtaobao"]], "Industrial Process Environments": [[104, "industrial-process-environments"]], " gym-inventory": [[104, "gym-inventory"]], " openmodelica-microgrid-gym": [[104, "openmodelica-microgrid-gym"]], "mobile-env": [[104, "mobile-env"]], "PyElastica": [[104, "pyelastica"]], "Financial Environments": [[104, "financial-environments"]], " gym-anytrading": [[104, "gym-anytrading"]], " gym-mtsim": [[104, "gym-mtsim"]], "Other Environments": [[104, "other-environments"]], " CARL": [[104, "carl"]], " CompilerGym": [[104, "compilergym"]], " DACBench": [[104, "dacbench"]], " gym-autokey": [[104, "gym-autokey"]], " gym-cellular-automata": [[104, "gym-cellular-automata"]], " gym-maze": [[104, "gym-maze"]], " gym-riverswim": [[104, "gym-riverswim"]], " gym-sokoban": [[104, "gym-sokoban"]], " math-prog-synth-env": [[104, "math-prog-synth-env"]], " NASGym": [[104, "nasgym"]], " NLPGym: A toolkit to develop RL agents to solve NLP tasks": [[104, "nlpgym-a-toolkit-to-develop-rl-agents-to-solve-nlp-tasks"]], " Obstacle Tower": [[104, "obstacle-tower"]], " QASGym": [[104, "qasgym"]], " mo-gym": [[104, "mo-gym"]], "gym-saturation": [[104, "gym-saturation"]], "ShinRL": [[104, "shinrl"]], "racing-rl": [[104, "racing-rl"]], " RubiksCubeGym": [[104, "rubikscubegym"]], "evogym-design-tool": [[104, "evogym-design-tool"]], "starship-landing-gym": [[104, "starship-landing-gym"]], "RaveForce": [[104, "raveforce"]], "gymnax": [[104, "gymnax"]], "Toy Text": [[105, "toy-text"]], "Blackjack": [[106, "blackjack"]], "Cliff Walking": [[107, "cliff-walking"]], "Frozen Lake": [[108, "frozen-lake"]], "Taxi": [[109, "taxi"]], "Info": [[109, "info"]], "Gymnasium is a standard API for reinforcement learning, and a diverse collection of reference environments": [[110, "gymnasium-is-a-standard-api-for-reinforcement-learning-and-a-diverse-collection-of-reference-environments"]], "Solving Blackjack with Q-Learning": [[111, "solving-blackjack-with-q-learning"]], "Imports and Environment Setup": [[111, "imports-and-environment-setup"]], "Observing the environment": [[111, "observing-the-environment"]], "Executing an action": [[111, "executing-an-action"]], "Building an agent": [[111, "building-an-agent"]], "Visualizing the training": [[111, "visualizing-the-training"]], "Visualising the policy": [[111, "visualising-the-policy"]], "Think you can do better?": [[111, "think-you-can-do-better"]], "Make your own custom environment": [[112, "make-your-own-custom-environment"]], "Subclassing gymnasium.Env": [[112, "subclassing-gymnasium-env"]], "Declaration and Initialization": [[112, "declaration-and-initialization"]], "Registering Envs": [[112, "registering-envs"]], "Creating a Package": [[112, "creating-a-package"]], "Creating Environment Instances": [[112, "creating-environment-instances"]], "Using Wrappers": [[112, "using-wrappers"]], "Handling Time Limits": [[113, "handling-time-limits"]], "Termination": [[113, "termination"]], "Truncation": [[113, "truncation"]], "Importance in learning code": [[113, "importance-in-learning-code"]], "Solution": [[113, "solution"]]}, "indexentries": {"env (class in gymnasium)": [[2, "gymnasium.Env"]], "action_space (gymnasium.env attribute)": [[2, "gymnasium.Env.action_space"]], "close() (in module gymnasium.env)": [[2, "gymnasium.Env.close"]], "metadata (gymnasium.env attribute)": [[2, "gymnasium.Env.metadata"]], "np_random (gymnasium.env property)": [[2, "gymnasium.Env.np_random"]], "observation_space (gymnasium.env attribute)": [[2, "gymnasium.Env.observation_space"]], "render() (in module gymnasium.env)": [[2, "gymnasium.Env.render"]], "render_mode (gymnasium.env attribute)": [[2, "gymnasium.Env.render_mode"]], "reset() (in module gymnasium.env)": [[2, "gymnasium.Env.reset"]], "reward_range (gymnasium.env attribute)": [[2, "gymnasium.Env.reward_range"]], "spec (gymnasium.env attribute)": [[2, "gymnasium.Env.spec"]], "step() (in module gymnasium.env)": [[2, "gymnasium.Env.step"]], "unwrapped (gymnasium.env property)": [[2, "gymnasium.Env.unwrapped"]], "make() (in module gymnasium)": [[3, "gymnasium.make"]], "register() (in module gymnasium)": [[3, "gymnasium.register"]], "spec() (in module gymnasium)": [[3, "gymnasium.spec"]], "space (class in gymnasium.spaces)": [[4, "gymnasium.spaces.Space"]], "contains() (in module gymnasium.spaces.space.space)": [[4, "gymnasium.spaces.space.Space.contains"]], "dtype (space property)": [[4, "Space.dtype"]], "from_jsonable() (in module gymnasium.spaces.space.space)": [[4, "gymnasium.spaces.space.Space.from_jsonable"]], "sample() (in module gymnasium.spaces.space.space)": [[4, "gymnasium.spaces.space.Space.sample"]], "seed() (in module gymnasium.spaces.space.space)": [[4, "gymnasium.spaces.space.Space.seed"]], "shape (gymnasium.spaces.space.space property)": [[4, "gymnasium.spaces.space.Space.shape"]], "to_jsonable() (in module gymnasium.spaces.space.space)": [[4, "gymnasium.spaces.space.Space.to_jsonable"]], "dict (class in gymnasium.spaces)": [[5, "gymnasium.spaces.Dict"]], "graph (class in gymnasium.spaces)": [[5, "gymnasium.spaces.Graph"]], "sequence (class in gymnasium.spaces)": [[5, "gymnasium.spaces.Sequence"]], "tuple (class in gymnasium.spaces)": [[5, "gymnasium.spaces.Tuple"]], "sample() (gymnasium.spaces.dict method)": [[5, "gymnasium.spaces.Dict.sample"]], "sample() (gymnasium.spaces.graph method)": [[5, "gymnasium.spaces.Graph.sample"]], "sample() (gymnasium.spaces.sequence method)": [[5, "gymnasium.spaces.Sequence.sample"]], "sample() (gymnasium.spaces.tuple method)": [[5, "gymnasium.spaces.Tuple.sample"]], "seed() (gymnasium.spaces.dict method)": [[5, "gymnasium.spaces.Dict.seed"]], "seed() (gymnasium.spaces.graph method)": [[5, "gymnasium.spaces.Graph.seed"]], "seed() (gymnasium.spaces.sequence method)": [[5, "gymnasium.spaces.Sequence.seed"]], "seed() (gymnasium.spaces.tuple method)": [[5, "gymnasium.spaces.Tuple.seed"]], "box (class in gymnasium.spaces)": [[6, "gymnasium.spaces.Box"]], "discrete (class in gymnasium.spaces)": [[6, "gymnasium.spaces.Discrete"]], "multibinary (class in gymnasium.spaces)": [[6, "gymnasium.spaces.MultiBinary"]], "multidiscrete (class in gymnasium.spaces)": [[6, "gymnasium.spaces.MultiDiscrete"]], "text (class in gymnasium.spaces)": [[6, "gymnasium.spaces.Text"]], "is_bounded() (gymnasium.spaces.box method)": [[6, "gymnasium.spaces.Box.is_bounded"]], "sample() (gymnasium.spaces.box method)": [[6, "gymnasium.spaces.Box.sample"]], "sample() (gymnasium.spaces.discrete method)": [[6, "gymnasium.spaces.Discrete.sample"]], "sample() (gymnasium.spaces.multibinary method)": [[6, "gymnasium.spaces.MultiBinary.sample"]], "sample() (gymnasium.spaces.multidiscrete method)": [[6, "gymnasium.spaces.MultiDiscrete.sample"]], "sample() (gymnasium.spaces.text method)": [[6, "gymnasium.spaces.Text.sample"]], "seed() (gymnasium.spaces.box method)": [[6, "gymnasium.spaces.Box.seed"]], "seed() (gymnasium.spaces.discrete method)": [[6, "gymnasium.spaces.Discrete.seed"]], "seed() (gymnasium.spaces.multibinary method)": [[6, "gymnasium.spaces.MultiBinary.seed"]], "seed() (gymnasium.spaces.multidiscrete method)": [[6, "gymnasium.spaces.MultiDiscrete.seed"]], "seed() (gymnasium.spaces.text method)": [[6, "gymnasium.spaces.Text.seed"]], "flatdim() (in module gymnasium.spaces.utils)": [[7, "gymnasium.spaces.utils.flatdim"]], "flatten() (in module gymnasium.spaces.utils)": [[7, "gymnasium.spaces.utils.flatten"]], "flatten_space() (in module gymnasium.spaces.utils)": [[7, "gymnasium.spaces.utils.flatten_space"]], "unflatten() (in module gymnasium.spaces.utils)": [[7, "gymnasium.spaces.utils.unflatten"]], "batch_space() (in module gymnasium.vector.utils)": [[8, "gymnasium.vector.utils.batch_space"]], "concatenate() (in module gymnasium.vector.utils)": [[8, "gymnasium.vector.utils.concatenate"]], "create_empty_array() (in module gymnasium.vector.utils)": [[8, "gymnasium.vector.utils.create_empty_array"]], "create_shared_memory() (in module gymnasium.vector.utils)": [[8, "gymnasium.vector.utils.create_shared_memory"]], "iterate() (in module gymnasium.vector.utils)": [[8, "gymnasium.vector.utils.iterate"]], "read_from_shared_memory() (in module gymnasium.vector.utils)": [[8, "gymnasium.vector.utils.read_from_shared_memory"]], "write_to_shared_memory() (in module gymnasium.vector.utils)": [[8, "gymnasium.vector.utils.write_to_shared_memory"]], "playplot (class in gymnasium.utils.play)": [[9, "gymnasium.utils.play.PlayPlot"]], "playablegame (class in gymnasium.utils.play)": [[9, "gymnasium.utils.play.PlayableGame"]], "callback() (gymnasium.utils.play.playplot method)": [[9, "gymnasium.utils.play.PlayPlot.callback"]], "capped_cubic_video_schedule() (in module gymnasium.utils.save_video)": [[9, "gymnasium.utils.save_video.capped_cubic_video_schedule"]], "check_env() (in module gymnasium.utils.env_checker)": [[9, "gymnasium.utils.env_checker.check_env"]], "convert_to_done_step_api() (in module gymnasium.utils.step_api_compatibility)": [[9, "gymnasium.utils.step_api_compatibility.convert_to_done_step_api"]], "convert_to_terminated_truncated_step_api() (in module gymnasium.utils.step_api_compatibility)": [[9, "gymnasium.utils.step_api_compatibility.convert_to_terminated_truncated_step_api"]], "np_random() (in module gymnasium.utils.seeding)": [[9, "gymnasium.utils.seeding.np_random"]], "play() (in module gymnasium.utils.play)": [[9, "gymnasium.utils.play.play"]], "process_event() (gymnasium.utils.play.playablegame method)": [[9, "gymnasium.utils.play.PlayableGame.process_event"]], "save_video() (in module gymnasium.utils.save_video)": [[9, "gymnasium.utils.save_video.save_video"]], "step_api_compatibility() (in module gymnasium.utils.step_api_compatibility)": [[9, "gymnasium.utils.step_api_compatibility.step_api_compatibility"]], "asyncvectorenv (class in gymnasium.vector)": [[10, "gymnasium.vector.AsyncVectorEnv"]], "syncvectorenv (class in gymnasium.vector)": [[10, "gymnasium.vector.SyncVectorEnv"]], "vectorenv (class in gymnasium.vector)": [[10, "gymnasium.vector.VectorEnv"]], "action_space": [[10, "action_space"]], "close() (gymnasium.vector.vectorenv method)": [[10, "gymnasium.vector.VectorEnv.close"]], "make() (in module gymnasium.vector)": [[10, "gymnasium.vector.make"]], "observation_space": [[10, "observation_space"]], "reset() (gymnasium.vector.vectorenv method)": [[10, "gymnasium.vector.VectorEnv.reset"]], "single_action_space": [[10, "single_action_space"]], "single_observation_space": [[10, "single_observation_space"]], "step() (gymnasium.vector.vectorenv method)": [[10, "gymnasium.vector.VectorEnv.step"]], "wrapper (class in gymnasium)": [[11, "gymnasium.Wrapper"]], "action_space (gymnasium.wrapper property)": [[11, "gymnasium.Wrapper.action_space"]], "close() (in module gymnasium.wrapper)": [[11, "gymnasium.Wrapper.close"]], "metadata (gymnasium.wrapper property)": [[11, "gymnasium.Wrapper.metadata"]], "np_random (gymnasium.wrapper property)": [[11, "gymnasium.Wrapper.np_random"]], "observation_space (gymnasium.wrapper property)": [[11, "gymnasium.Wrapper.observation_space"]], "reset() (in module gymnasium.wrapper)": [[11, "gymnasium.Wrapper.reset"]], "reward_range (gymnasium.wrapper property)": [[11, "gymnasium.Wrapper.reward_range"]], "spec (gymnasium.wrapper property)": [[11, "gymnasium.Wrapper.spec"]], "step() (in module gymnasium.wrapper)": [[11, "gymnasium.Wrapper.step"]], "unwrapped (gymnasium.wrapper property)": [[11, "gymnasium.Wrapper.unwrapped"]], "actionwrapper (class in gymnasium)": [[12, "gymnasium.ActionWrapper"]], "actionwrapper.action() (in module gymnasium.actionwrapper)": [[12, "gymnasium.ActionWrapper.ActionWrapper.action"]], "clipaction (class in gymnasium.wrappers)": [[12, "gymnasium.wrappers.ClipAction"]], "rescaleaction (class in gymnasium.wrappers)": [[12, "gymnasium.wrappers.RescaleAction"]], "ataripreprocessing (class in gymnasium.wrappers)": [[13, "gymnasium.wrappers.AtariPreprocessing"]], "autoresetwrapper (class in gymnasium.wrappers)": [[13, "gymnasium.wrappers.AutoResetWrapper"]], "envcompatibility (class in gymnasium.wrappers)": [[13, "gymnasium.wrappers.EnvCompatibility"]], "humanrendering (class in gymnasium.wrappers)": [[13, "gymnasium.wrappers.HumanRendering"]], "orderenforcing (class in gymnasium.wrappers)": [[13, "gymnasium.wrappers.OrderEnforcing"]], "passiveenvchecker (class in gymnasium.wrappers)": [[13, "gymnasium.wrappers.PassiveEnvChecker"]], "recordepisodestatistics (class in gymnasium.wrappers)": [[13, "gymnasium.wrappers.RecordEpisodeStatistics"]], "recordvideo (class in gymnasium.wrappers)": [[13, "gymnasium.wrappers.RecordVideo"]], "rendercollection (class in gymnasium.wrappers)": [[13, "gymnasium.wrappers.RenderCollection"]], "stepapicompatibility (class in gymnasium.wrappers)": [[13, "gymnasium.wrappers.StepAPICompatibility"]], "timelimit (class in gymnasium.wrappers)": [[13, "gymnasium.wrappers.TimeLimit"]], "vectorlistinfo (class in gymnasium.wrappers)": [[13, "gymnasium.wrappers.VectorListInfo"]], "filterobservation (class in gymnasium.wrappers)": [[14, "gymnasium.wrappers.FilterObservation"]], "flattenobservation (class in gymnasium.wrappers)": [[14, "gymnasium.wrappers.FlattenObservation"]], "framestack (class in gymnasium.wrappers)": [[14, "gymnasium.wrappers.FrameStack"]], "grayscaleobservation (class in gymnasium.wrappers)": [[14, "gymnasium.wrappers.GrayScaleObservation"]], "normalizeobservation (class in gymnasium.wrappers)": [[14, "gymnasium.wrappers.NormalizeObservation"]], "observationwrapper (class in gymnasium)": [[14, "gymnasium.ObservationWrapper"]], "pixelobservationwrapper (class in gymnasium.wrappers)": [[14, "gymnasium.wrappers.PixelObservationWrapper"]], "resizeobservation (class in gymnasium.wrappers)": [[14, "gymnasium.wrappers.ResizeObservation"]], "timeawareobservation (class in gymnasium.wrappers)": [[14, "gymnasium.wrappers.TimeAwareObservation"]], "transformobservation (class in gymnasium.wrappers)": [[14, "gymnasium.wrappers.TransformObservation"]], "observation() (in module gymnasium.observationwrapper)": [[14, "gymnasium.ObservationWrapper.observation"]], "normalizereward (class in gymnasium.wrappers)": [[15, "gymnasium.wrappers.NormalizeReward"]], "rewardwrapper (class in gymnasium)": [[15, "gymnasium.RewardWrapper"]], "rewardwrapper.reward() (in module gymnasium.rewardwrapper)": [[15, "gymnasium.RewardWrapper.RewardWrapper.reward"]], "transformreward (class in gymnasium.wrappers)": [[15, "gymnasium.wrappers.TransformReward"]]}}) |