Search.setIndex({"docnames": ["404", "README", "api/env", "api/registry", "api/spaces", "api/spaces/composite", "api/spaces/fundamental", "api/spaces/utils", "api/spaces/vector_utils", "api/utils", "api/vector", "api/wrappers", "api/wrappers/action_wrappers", "api/wrappers/misc_wrappers", "api/wrappers/observation_wrappers", "api/wrappers/reward_wrappers", "content/basic_usage", "content/environment_creation", "content/handling_timelimits", "content/vectorising", "environments/atari", "environments/atari/adventure", "environments/atari/air_raid", "environments/atari/alien", "environments/atari/amidar", "environments/atari/assault", "environments/atari/asterix", "environments/atari/asteroids", "environments/atari/atlantis", "environments/atari/bank_heist", "environments/atari/battle_zone", "environments/atari/beam_rider", "environments/atari/berzerk", "environments/atari/bowling", "environments/atari/boxing", "environments/atari/breakout", "environments/atari/carnival", "environments/atari/centipede", "environments/atari/chopper_command", "environments/atari/complete_list", "environments/atari/crazy_climber", "environments/atari/defender", "environments/atari/demon_attack", "environments/atari/double_dunk", "environments/atari/elevator_action", "environments/atari/enduro", "environments/atari/fishing_derby", "environments/atari/freeway", "environments/atari/frostbite", "environments/atari/gopher", "environments/atari/gravitar", "environments/atari/hero", "environments/atari/ice_hockey", "environments/atari/jamesbond", "environments/atari/journey_escape", "environments/atari/kangaroo", "environments/atari/krull", "environments/atari/kung_fu_master", "environments/atari/montezuma_revenge", "environments/atari/ms_pacman", "environments/atari/name_this_game", "environments/atari/phoenix", "environments/atari/pitfall", "environments/atari/pong", "environments/atari/pooyan", "environments/atari/private_eye", "environments/atari/qbert", "environments/atari/riverraid", "environments/atari/road_runner", "environments/atari/robotank", "environments/atari/seaquest", "environments/atari/skiing", "environments/atari/solaris", "environments/atari/space_invaders", "environments/atari/star_gunner", "environments/atari/tennis", "environments/atari/time_pilot", "environments/atari/tutankham", "environments/atari/up_n_down", "environments/atari/venture", "environments/atari/video_pinball", "environments/atari/wizard_of_wor", "environments/atari/zaxxon", "environments/box2d", "environments/box2d/bipedal_walker", "environments/box2d/car_racing", "environments/box2d/lunar_lander", "environments/classic_control", "environments/classic_control/acrobot", "environments/classic_control/cart_pole", "environments/classic_control/mountain_car", "environments/classic_control/mountain_car_continuous", "environments/classic_control/pendulum", "environments/mujoco", "environments/mujoco/ant", "environments/mujoco/half_cheetah", "environments/mujoco/hopper", "environments/mujoco/humanoid", "environments/mujoco/humanoid_standup", "environments/mujoco/inverted_double_pendulum", "environments/mujoco/inverted_pendulum", "environments/mujoco/pusher", "environments/mujoco/reacher", "environments/mujoco/swimmer", "environments/mujoco/walker2d", "environments/third_party_environments", "environments/toy_text", "environments/toy_text/blackjack", "environments/toy_text/cliff_walking", "environments/toy_text/frozen_lake", "environments/toy_text/taxi", "index"], "filenames": ["404.md", "README.md", "api/env.md", "api/registry.md", "api/spaces.md", "api/spaces/composite.md", "api/spaces/fundamental.md", "api/spaces/utils.md", "api/spaces/vector_utils.md", "api/utils.md", "api/vector.md", "api/wrappers.md", "api/wrappers/action_wrappers.md", "api/wrappers/misc_wrappers.md", "api/wrappers/observation_wrappers.md", "api/wrappers/reward_wrappers.md", "content/basic_usage.md", "content/environment_creation.md", "content/handling_timelimits.md", "content/vectorising.md", "environments/atari.md", "environments/atari/adventure.md", "environments/atari/air_raid.md", "environments/atari/alien.md", "environments/atari/amidar.md", "environments/atari/assault.md", "environments/atari/asterix.md", "environments/atari/asteroids.md", "environments/atari/atlantis.md", "environments/atari/bank_heist.md", "environments/atari/battle_zone.md", "environments/atari/beam_rider.md", "environments/atari/berzerk.md", "environments/atari/bowling.md", "environments/atari/boxing.md", "environments/atari/breakout.md", "environments/atari/carnival.md", "environments/atari/centipede.md", "environments/atari/chopper_command.md", "environments/atari/complete_list.md", "environments/atari/crazy_climber.md", "environments/atari/defender.md", "environments/atari/demon_attack.md", "environments/atari/double_dunk.md", "environments/atari/elevator_action.md", "environments/atari/enduro.md", "environments/atari/fishing_derby.md", "environments/atari/freeway.md", "environments/atari/frostbite.md", "environments/atari/gopher.md", "environments/atari/gravitar.md", "environments/atari/hero.md", "environments/atari/ice_hockey.md", "environments/atari/jamesbond.md", "environments/atari/journey_escape.md", "environments/atari/kangaroo.md", "environments/atari/krull.md", "environments/atari/kung_fu_master.md", "environments/atari/montezuma_revenge.md", "environments/atari/ms_pacman.md", "environments/atari/name_this_game.md", "environments/atari/phoenix.md", "environments/atari/pitfall.md", "environments/atari/pong.md", "environments/atari/pooyan.md", "environments/atari/private_eye.md", "environments/atari/qbert.md", "environments/atari/riverraid.md", "environments/atari/road_runner.md", "environments/atari/robotank.md", "environments/atari/seaquest.md", "environments/atari/skiing.md", "environments/atari/solaris.md", "environments/atari/space_invaders.md", "environments/atari/star_gunner.md", "environments/atari/tennis.md", "environments/atari/time_pilot.md", "environments/atari/tutankham.md", "environments/atari/up_n_down.md", "environments/atari/venture.md", "environments/atari/video_pinball.md", "environments/atari/wizard_of_wor.md", "environments/atari/zaxxon.md", "environments/box2d.md", "environments/box2d/bipedal_walker.md", "environments/box2d/car_racing.md", "environments/box2d/lunar_lander.md", "environments/classic_control.md", "environments/classic_control/acrobot.md", "environments/classic_control/cart_pole.md", "environments/classic_control/mountain_car.md", "environments/classic_control/mountain_car_continuous.md", "environments/classic_control/pendulum.md", "environments/mujoco.md", "environments/mujoco/ant.md", "environments/mujoco/half_cheetah.md", "environments/mujoco/hopper.md", "environments/mujoco/humanoid.md", "environments/mujoco/humanoid_standup.md", "environments/mujoco/inverted_double_pendulum.md", "environments/mujoco/inverted_pendulum.md", "environments/mujoco/pusher.md", "environments/mujoco/reacher.md", "environments/mujoco/swimmer.md", "environments/mujoco/walker2d.md", "environments/third_party_environments.md", "environments/toy_text.md", "environments/toy_text/blackjack.md", "environments/toy_text/cliff_walking.md", "environments/toy_text/frozen_lake.md", "environments/toy_text/taxi.md", "index.md"], "titles": ["404 - Page Not Found", "Gymnasium-docs", "Env", "Registry", "Spaces", "Composite Spaces", "Fundamental Spaces", "Spaces Utils", "Spaces Vector Utils", "Utils", "Vector", "Wrappers", "Action Wrappers", "Misc Wrappers", "Observation Wrappers", "Reward Wrappers", "Basic Usage", "Make your own custom environment", "Handling Time Limits", "Vectorizing your environments", "Atari", "Adventure", "Air Raid", "Alien", "Amidar", "Assault", "Asterix", "Asteroids", "Atlantis", "Bank Heist", "Battle Zone", "Beam Rider", "Berzerk", "Bowling", "Boxing", "Breakout", "Carnival", "Centipede", "Chopper Command", "Complete List - Atari", "Crazy Climber", "Defender", "Demon Attack", "Double Dunk", "Elevator Action", "Enduro", "FishingDerby", "Freeway", "Frostbite", "Gopher", "Gravitar", "Hero", "IceHockey", "Jamesbond", "JourneyEscape", "Kangaroo", "Krull", "Kung Fu Master", "Montezuma Revenge", "Ms Pacman", "Name This Game", "Phoenix", "Pitfall", "Pong", "Pooyan", "PrivateEye", "Qbert", "Riverraid", "Road Runner", "Robot Tank", "Seaquest", "Skiings", "Solaris", "SpaceInvaders", "StarGunner", "Tennis", "TimePilot", "Tutankham", "Up n\u2019 Down", "Venture", "Video Pinball", "Wizard of Wor", "Zaxxon", "Box2D", "Bipedal Walker", "Car Racing", "Lunar Lander", "Classic Control", "Acrobot", "Cart Pole", "Mountain Car", "Mountain Car Continuous", "Pendulum", "MuJoCo", "Ant", "Half Cheetah", "Hopper", "Humanoid", "Humanoid Standup", "Inverted Double Pendulum", "Inverted Pendulum", "Pusher", "Reacher", "Swimmer", "Walker2D", "Third-Party Environments", "Toy Text", "Blackjack", "Cliff Walking", "Frozen Lake", "Taxi", "Gymnasium is a standard API for reinforcement learning, and a diverse collection of reference environments"], "terms": {"thi": [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 107, 108, 109, 110], "folder": [1, 9, 13, 101, 102], "contain": [1, 2, 4, 7, 8, 10, 11, 13, 14, 17, 19, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 94, 95, 96, 97, 101, 102, 103, 104, 105, 107, 110], "If": [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 19, 20, 26, 29, 34, 37, 46, 47, 48, 49, 50, 64, 71, 75, 84, 85, 86, 91, 94, 96, 97, 98, 102, 104, 107, 108, 109], "you": [1, 2, 4, 5, 6, 7, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 84, 85, 86, 94, 97, 98, 101, 102, 105], "ar": [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 110], "pleas": [1, 2, 9, 19, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 84, 85, 86, 88, 89, 90, 91, 92, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 107, 108, 109, 110], "pr": [1, 105], "repo": [1, 20, 105], "otherwis": [1, 2, 3, 5, 6, 9, 10, 13, 14, 19, 20, 33, 105], "follow": [1, 3, 4, 9, 11, 12, 13, 15, 16, 17, 18, 19, 20, 33, 43, 45, 46, 47, 48, 49, 50, 75, 88, 89, 90, 91, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 107, 109], "below": [1, 6, 11, 18, 46, 84, 86, 92, 101, 104], "directli": [1, 5, 11, 13, 16, 17, 19, 88, 105], "markdown": 1, "file": [1, 17, 88, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104], "repositori": [1, 11, 93, 105], "fork": [1, 105, 111], "docstr": 1, "": [1, 2, 5, 6, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 20, 40, 46, 47, 48, 49, 50, 52, 53, 56, 57, 58, 63, 64, 66, 83, 84, 85, 86, 87, 88, 90, 91, 92, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 106, 107, 109, 110, 111], "python": [1, 3, 8, 13, 17, 84, 85, 86, 105, 106, 111], "Then": [1, 11, 12, 16, 70, 103], "pip": [1, 17, 20, 83, 87, 93], "instal": [1, 9, 13, 17, 28, 83, 87, 93], "your": [1, 2, 10, 11, 12, 13, 14, 15, 16, 23, 24, 26, 28, 29, 31, 33, 34, 35, 37, 43, 45, 46, 47, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 63, 65, 66, 67, 68, 69, 70, 71, 72, 73, 76, 77, 78, 79, 80, 81, 82, 85, 94, 97, 98], "run": [1, 2, 3, 10, 13, 16, 17, 19, 29, 51, 54, 62, 67, 68, 71, 72, 84, 86, 88, 94, 95, 96, 97, 98, 99, 100, 103, 104, 105], "script": 1, "gen_md": 1, "py": [1, 8, 17, 20, 84, 85, 86, 93, 94, 97, 98, 108], "automat": [1, 2, 3, 10, 11, 13, 17, 19, 105], "gener": [1, 2, 4, 5, 6, 9, 10, 11, 13, 14, 16, 17, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 84, 85, 86, 88, 89, 90, 91, 92, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 107, 108, 109, 110, 111], "For": [1, 2, 6, 7, 9, 11, 13, 14, 16, 17, 19, 20, 21, 23, 24, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 41, 51, 52, 53, 54, 55, 56, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 85, 86, 109, 110], "add": [1, 3, 9, 10, 14, 16, 17, 85, 93, 97, 98, 105, 110], "complet": [1, 11, 13, 16, 18, 20, 40, 53, 65, 66, 85, 86], "ensur": [1, 2, 3, 5, 7, 9, 16, 17], "i": [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 84, 85, 86, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 107, 108, 109, 110], "ha": [1, 2, 4, 6, 7, 9, 11, 13, 14, 15, 16, 17, 18, 19, 20, 50, 70, 84, 85, 86, 87, 93, 94, 95, 96, 97, 98, 101, 102, 103, 104, 105, 107, 109], "properli": [1, 4, 19], "format": [1, 4, 9, 11, 13, 14, 16], "md": [1, 17], "correspond": [1, 2, 3, 16, 17, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 86, 88, 89, 90, 91, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 107, 110], "gif": [1, 88], "_static": 1, "video": [1, 11, 39, 69, 84], "env_typ": 1, "where": [1, 3, 5, 6, 7, 9, 11, 13, 14, 16, 17, 18, 19, 20, 43, 85, 88, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 107, 109, 110], "categori": 1, "e": [1, 2, 4, 6, 7, 8, 10, 11, 13, 14, 16, 17, 19, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 101, 102, 105, 107], "g": [1, 2, 4, 6, 7, 8, 10, 11, 16, 17, 19, 71, 88, 92, 105, 109, 110], "mujoco": [1, 11, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105], "snake_cas": 1, "name": [1, 3, 11, 17, 39, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104], "convent": [1, 2, 20], "altern": [1, 19, 20, 105], "gen_gif": 1, "index": [1, 8, 9, 13, 14, 16, 20, 89, 98, 108], "toctre": 1, "requir": [1, 2, 4, 14, 16, 19, 93, 105], "packag": [1, 13, 105], "r": [1, 6, 13, 15, 69, 88, 92, 110], "txt": 1, "To": [1, 3, 8, 10, 13, 14, 15, 16, 17, 19, 20, 28, 38, 66, 84, 85, 86, 88, 110], "onc": [1, 13, 17, 27, 37, 44, 51, 99, 102, 110], "cd": [1, 17], "make": [1, 2, 5, 9, 11, 12, 13, 14, 15, 16, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 84, 85, 86, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 107, 108, 109, 110, 111], "dirhtml": 1, "_build": 1, "rebuild": [1, 28], "everi": [1, 9, 13, 16, 17, 37, 38, 42, 47, 69, 70, 79, 85, 86, 89, 94, 96, 97, 104, 105], "time": [1, 2, 3, 5, 9, 10, 11, 16, 17, 20, 36, 39, 42, 43, 44, 48, 52, 54, 55, 62, 66, 67, 68, 69, 70, 71, 84, 85, 92, 94, 95, 96, 97, 98, 103, 104, 105, 108], "chang": [1, 2, 8, 9, 10, 11, 13, 14, 15, 17, 20, 48, 56, 66, 85, 88, 89, 90, 91, 92, 93, 101, 102, 105, 110], "made": [1, 16, 101, 102], "sphinx": 1, "autobuild": 1, "b": [1, 6, 101, 102, 110], "class": [2, 4, 5, 6, 9, 10, 11, 12, 13, 14, 15, 16, 17, 19, 93], "The": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 107, 108, 109, 110, 111], "main": [2, 19, 86, 96, 104], "reinforc": [2, 4, 18, 19, 88, 103, 106, 107, 108, 110], "learn": [2, 4, 5, 13, 14, 15, 17, 19, 20, 46, 47, 48, 49, 50, 84, 85, 86, 88, 89, 90, 91, 95, 98, 99, 100, 103, 106, 107, 108, 110], "agent": [2, 4, 11, 13, 14, 16, 17, 18, 19, 20, 44, 53, 84, 85, 86, 90, 94, 95, 96, 97, 98, 99, 100, 103, 104, 108, 109, 110], "encapsul": 2, "an": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 86, 88, 89, 90, 91, 92, 94, 95, 96, 97, 98, 101, 102, 103, 104, 105, 107, 108, 110], "arbitrari": [2, 3, 6, 9, 14, 15, 105], "behind": [2, 64], "scene": [2, 64, 105], "dynam": [2, 20, 35, 46, 47, 48, 49, 50, 88, 92, 93, 99, 105], "through": [2, 3, 4, 10, 16, 18, 20, 35, 51, 54, 57, 58, 62, 71, 72, 97, 98, 105], "step": [2, 3, 10, 11, 12, 13, 14, 15, 18, 19, 20, 84, 86, 88, 89, 92, 105, 108, 110, 111], "reset": [2, 3, 9, 10, 11, 12, 13, 14, 15, 16, 19, 88, 89, 90, 91, 92, 105, 110, 111], "function": [2, 3, 4, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 18, 19, 86, 92, 102, 105, 109, 110, 111], "can": [2, 3, 4, 5, 6, 9, 10, 11, 12, 13, 14, 15, 16, 17, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 107, 109, 110], "partial": 2, "fulli": [2, 105], "observ": [2, 4, 5, 8, 9, 10, 11, 12, 13, 15, 16, 18, 105, 111], "singl": [2, 4, 5, 6, 7, 8, 9, 10, 14, 17, 19, 96, 97, 98, 104], "multi": [2, 6, 93, 97, 98, 101], "see": [2, 4, 9, 10, 16, 17, 19, 20, 21, 24, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 41, 51, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 86, 88, 94, 95, 96, 97, 103, 104, 105], "pettingzoo": 2, "api": [2, 11, 13, 17, 18, 105], "user": [2, 3, 10, 16, 17, 20, 88, 89, 90, 91, 92, 105, 111], "need": [2, 3, 4, 5, 9, 11, 12, 13, 14, 16, 17, 18, 38, 40, 45, 51, 55, 65, 70, 84, 86, 89, 93], "know": [2, 13, 17], "updat": [2, 9, 13, 14, 17, 18, 110], "action": [2, 3, 4, 5, 6, 9, 10, 11, 13, 16, 17, 39, 87, 105, 106, 111], "return": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 84, 94, 95, 96, 97, 98, 99, 101, 102, 103, 104, 105, 108, 110], "next": [2, 8, 40, 42, 44], "reward": [2, 3, 9, 10, 11, 13, 16, 17, 18, 19, 93, 105, 111], "take": [2, 3, 6, 7, 9, 10, 11, 12, 13, 16, 19, 20, 73, 87, 89, 91, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 109, 110], "termin": [2, 3, 9, 10, 11, 13, 15, 16, 17, 19, 88, 89, 90, 91, 94, 96, 97, 98, 99, 100, 101, 102, 104, 108, 111], "truncat": [2, 3, 9, 10, 11, 13, 15, 16, 17, 19, 88, 89, 90, 91, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 111], "due": [2, 18, 109], "latest": 2, "inform": [2, 4, 5, 6, 9, 10, 11, 13, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 84, 85, 86, 88, 89, 90, 91, 92, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 107, 108, 109, 110], "from": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 18, 19, 20, 22, 36, 43, 48, 49, 52, 54, 63, 64, 76, 82, 84, 85, 86, 88, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 108, 109, 110], "about": [2, 9, 14, 16, 17, 18, 19, 65, 88, 94, 97, 98], "metric": [2, 9], "debug": [2, 4, 9, 106], "info": [2, 9, 10, 11, 14, 15, 16, 17, 18, 19, 94, 95, 96, 97, 101, 102, 103, 104, 111], "initi": [2, 3, 5, 6, 10, 11, 12, 13, 14, 15, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 84, 86, 87, 88, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 107, 108, 109, 110], "state": [2, 11, 13, 14, 16, 18, 20, 87, 93, 105, 106, 108, 110], "befor": [2, 3, 9, 10, 11, 12, 13, 14, 15, 16, 17, 28, 40, 54, 65, 72, 73, 85, 94, 95, 96, 97, 98, 99, 100, 102, 103, 104], "call": [2, 3, 7, 9, 10, 11, 12, 13, 14, 16, 17, 19, 20, 33, 52, 101, 102, 107, 109], "first": [2, 9, 10, 11, 13, 14, 16, 17, 19, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 84, 85, 86, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 107, 108, 109, 110], "episod": [2, 3, 9, 11, 14, 16, 17, 18, 19, 108, 110], "render": [2, 10, 11, 14, 16, 20, 83, 84, 94, 95, 96, 97, 98, 99, 100, 103, 104, 105], "help": [2, 4, 16, 23, 55, 58, 101, 105], "visualis": 2, "what": [2, 4, 13, 16, 20, 110], "exampl": [2, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 85, 88, 105, 107, 108, 109], "mode": [2, 10, 11, 13, 17, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82], "human": [2, 5, 11, 16, 17, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 85, 97, 98, 101, 105, 111], "rgb_arrai": [2, 9, 11, 13, 14, 16, 17, 20], "ansi": [2, 17], "text": [2, 4, 5, 7, 105, 107, 108, 109, 110], "close": [2, 6, 9, 10, 11, 16, 40, 65, 94, 96, 97, 102, 104, 111], "import": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 19, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 84, 85, 86, 88, 89, 90, 91, 92, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 107, 108, 109, 110, 111], "when": [2, 4, 5, 7, 8, 9, 10, 11, 13, 14, 15, 16, 17, 18, 19, 20, 23, 36, 40, 41, 42, 44, 46, 47, 48, 49, 50, 52, 53, 67, 68, 69, 70, 73, 85, 86, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 108, 110], "extern": [2, 18, 94, 97, 98], "softwar": [2, 105], "us": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 108, 109, 110], "pygam": [2, 9, 16, 17, 83, 105], "databas": 2, "have": [2, 3, 6, 7, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 23, 26, 28, 29, 33, 35, 37, 38, 40, 41, 46, 47, 48, 49, 50, 51, 54, 55, 56, 60, 62, 64, 70, 72, 83, 84, 85, 88, 94, 95, 96, 97, 98, 100, 101, 103, 104, 105, 107, 110], "understand": [2, 7, 10, 101, 105], "action_spac": [2, 9, 10, 11, 12, 14, 15, 16, 17, 19, 110], "space": [2, 9, 10, 11, 12, 13, 14, 17, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 93, 105, 106, 108, 110], "object": [2, 4, 8, 11, 16, 19, 21, 26, 40, 46, 47, 55, 67, 73, 101, 105], "valid": [2, 3, 4, 6, 8, 10, 11, 12, 13, 16, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82], "all": [2, 5, 6, 10, 11, 13, 16, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 47, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 85, 86, 87, 88, 89, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 108], "should": [2, 4, 6, 9, 10, 13, 14, 16, 17, 19, 101, 102], "within": [2, 4, 12, 14, 58, 62, 86, 87, 99, 100, 105], "observation_spac": [2, 5, 6, 10, 11, 14, 16, 17, 19], "reward_rang": [2, 11, 15], "A": [2, 4, 5, 6, 7, 9, 10, 12, 13, 14, 15, 17, 18, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 84, 85, 88, 89, 91, 94, 95, 96, 97, 98, 99, 101, 102, 103, 104, 109], "tupl": [2, 4, 6, 7, 8, 9, 11, 14, 16, 17, 19, 20, 94, 96, 97, 104, 107, 110], "minimum": [2, 6, 92], "maximum": [2, 3, 6, 9, 13, 16, 17, 69, 70, 86, 88, 92, 99, 105], "possibl": [2, 5, 6, 7, 16, 17, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 86, 88, 89, 90, 91, 95, 97, 99, 100, 103, 104, 105, 108, 109, 110], "over": [2, 8, 13, 15, 16, 19, 23, 29, 52, 62, 67, 95, 97, 107, 109], "default": [2, 3, 4, 5, 6, 9, 10, 11, 13, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 85, 88, 92, 94, 95, 96, 97, 101, 102, 103, 104, 105], "rang": [2, 8, 9, 11, 12, 13, 15, 16, 17, 20, 52, 84, 87, 88, 89, 90, 91, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 111], "set": [2, 5, 6, 10, 11, 12, 13, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 78, 79, 80, 81, 83, 86, 87, 88, 90, 91, 93, 94, 95, 96, 97, 101, 102, 103, 104, 105], "infti": [2, 6], "spec": [2, 10, 11, 13], "metadata": [2, 9, 11, 13, 17, 20], "fp": [2, 9, 17, 20], "np_random": [2, 9, 11, 13, 17], "random": [2, 4, 5, 6, 9, 13, 14, 16, 17, 19, 20, 85, 86, 88, 89, 90, 91, 92, 94, 95, 96, 97, 102, 103, 104, 105, 109, 110], "number": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 13, 14, 16, 17, 19, 20, 22, 23, 24, 25, 26, 27, 28, 31, 32, 33, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 54, 57, 59, 60, 61, 63, 64, 66, 69, 71, 73, 74, 76, 77, 78, 80, 81, 85, 86, 88, 96, 97, 98, 103, 104, 107, 109], "assign": [2, 71, 89, 90, 91, 101, 102], "dure": [2, 5, 6, 10, 11, 13, 17, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 88, 94, 95, 96, 97, 103, 104, 110], "super": [2, 11, 12, 14, 15, 17, 19], "seed": [2, 3, 4, 5, 6, 10, 16, 17, 68, 111], "assess": 2, "self": [2, 4, 5, 11, 12, 13, 14, 15, 17, 19, 91, 105], "modifi": [2, 4, 10, 11, 12, 14, 15, 16, 17, 88, 101, 102, 105, 110], "extend": [2, 105], "wrapper": [2, 3, 5, 6, 9, 10, 19, 101, 102, 105], "acttyp": [2, 9, 11], "obstyp": [2, 9, 11], "float": [2, 3, 7, 9, 11, 12, 14, 15, 17, 19, 20, 51, 64, 86, 94, 95, 96, 97, 103, 104, 105], "bool": [2, 3, 4, 6, 9, 10, 11, 13, 14, 17, 19, 20, 86, 94, 95, 96, 97, 103, 104], "dict": [2, 4, 6, 7, 8, 9, 10, 11, 13, 14, 16, 17, 19], "one": [2, 5, 6, 7, 9, 10, 11, 13, 14, 16, 18, 19, 22, 23, 24, 28, 33, 40, 43, 44, 56, 65, 66, 67, 69, 70, 75, 88, 89, 90, 91, 92, 94, 96, 98, 99, 100, 102, 103, 105, 107, 110], "timestep": [2, 13, 14, 16, 17, 90, 91, 94, 96, 97, 98, 99, 100, 101, 102, 104], "end": [2, 11, 13, 16, 18, 19, 28, 37, 38, 40, 42, 44, 45, 53, 54, 55, 65, 69, 72, 73, 84, 92, 105, 108, 110], "reach": [2, 11, 17, 18, 28, 30, 40, 43, 44, 61, 64, 72, 73, 87, 88, 89, 90, 91, 94, 96, 97, 98, 99, 100, 101, 102, 104, 105, 108, 109, 110], "necessari": [2, 4, 20, 46, 47, 48, 49, 50], "version": [2, 3, 4, 11, 17, 18, 19, 89, 105], "0": [2, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 84, 85, 86, 88, 89, 90, 91, 92, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 107, 108, 109, 110], "26": [2, 16, 17, 18, 94, 97, 98], "wa": [2, 9, 10, 11, 14, 15, 16, 18, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 94, 95, 96, 97, 103, 104, 105], "remov": [2, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 88, 110], "done": [2, 3, 9, 11, 13, 16, 17, 18, 94, 96, 97, 98, 99, 100, 104], "favor": 2, "clearer": 2, "had": 2, "which": [2, 3, 4, 5, 7, 8, 9, 10, 11, 13, 14, 15, 16, 17, 18, 20, 40, 42, 44, 58, 85, 86, 88, 89, 93, 94, 95, 96, 97, 98, 99, 101, 102, 103, 104, 105, 109, 110], "critic": [2, 13], "bootstrap": [2, 18], "algorithm": [2, 4, 18, 19, 93, 106, 110], "paramet": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 19, 86, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 103, 104], "provid": [2, 4, 5, 6, 9, 10, 11, 12, 13, 14, 16, 17, 19, 20, 26, 40, 42, 46, 47, 48, 49, 50, 84, 88, 105], "element": [2, 4, 5, 6, 8, 10, 14, 16, 17, 19, 89, 90, 91, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 109], "numpi": [2, 4, 6, 8, 10, 11, 12, 14, 16, 17, 105, 108], "arrai": [2, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 17, 19, 86, 105], "posit": [2, 5, 6, 7, 8, 9, 13, 14, 16, 17, 19, 20, 31, 52, 84, 85, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 108, 109, 110], "veloc": [2, 5, 7, 8, 16, 19, 84, 86, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104], "pole": [2, 71, 87, 99, 100, 105], "cartpol": [2, 3, 9, 10, 13, 14, 15, 16, 19, 87, 89, 99, 100, 105], "result": [2, 7, 9, 10, 88, 94, 97, 98, 105, 106, 108, 110], "whether": [2, 3, 6, 9, 13, 17, 18, 19, 33, 86, 94, 95, 96, 97, 103, 104, 107], "defin": [2, 4, 7, 11, 12, 13, 14, 15, 16, 17, 18, 19, 92, 97, 111], "under": [2, 14, 15, 105], "mdp": [2, 13, 16, 90, 91], "task": [2, 5, 11, 14, 16, 17, 18, 56, 62, 65, 85, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 108], "neg": [2, 6, 9, 16, 71, 91, 94, 95, 97, 98, 99, 101, 102], "goal": [2, 16, 17, 23, 26, 31, 33, 35, 37, 40, 52, 57, 58, 59, 60, 61, 63, 66, 68, 70, 71, 77, 78, 79, 80, 81, 82, 88, 89, 90, 91, 92, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 107, 108, 109, 110], "move": [2, 11, 15, 17, 18, 22, 25, 26, 35, 36, 50, 53, 64, 67, 70, 71, 84, 86, 89, 94, 95, 96, 98, 99, 100, 101, 102, 103, 104, 105, 108, 109, 110], "lava": [2, 51], "sutton": [2, 88, 89, 99, 100, 107, 108], "barton": 2, "gridworld": [2, 17, 108], "true": [2, 3, 7, 9, 10, 12, 13, 14, 16, 17, 19, 20, 46, 47, 48, 49, 50, 84, 85, 86, 94, 95, 96, 97, 103, 104, 107, 109], "condit": [2, 16, 18], "outsid": [2, 18, 85, 86], "scope": [2, 18], "satisfi": 2, "typic": [2, 9, 105, 110], "timelimit": [2, 3, 11, 13, 16, 17, 18], "could": [2, 9, 14, 15, 17, 18, 20, 105], "also": [2, 3, 6, 9, 10, 11, 13, 14, 16, 17, 18, 20, 32, 53, 54, 65, 66, 68, 84, 85, 86, 87, 93, 94, 95, 96, 97, 103, 104, 105], "indic": [2, 9, 13, 18, 19, 85, 88, 89, 94, 97, 98, 110], "physic": [2, 83, 93, 99, 100, 105], "go": [2, 18, 19, 44, 71, 75, 85, 107], "out": [2, 8, 17, 18, 20, 29, 34, 51, 54, 62, 67, 72], "bound": [2, 6, 11, 12, 16, 18, 86, 88, 89, 90, 91, 92], "prematur": 2, "auxiliari": [2, 17], "diagnost": 2, "log": 2, "might": [2, 4, 6, 7, 11, 12, 13, 14, 15, 16, 17, 19, 105], "instanc": [2, 3, 4, 5, 7, 8, 9, 10, 11, 13, 15, 16, 19, 105], "describ": [2, 5, 16, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 88, 89, 103, 105, 107], "perform": [2, 9, 13, 16, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 102, 105], "variabl": [2, 4, 6, 10, 13, 17, 18, 96, 103, 104, 105], "hidden": [2, 93, 105], "individu": [2, 11, 17, 19, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104], "term": [2, 11, 17, 87, 88, 93, 94, 95, 96, 97, 101, 102, 103, 104], "combin": [2, 4, 9, 11, 16, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 51, 52, 53, 54, 55, 56, 57, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 102], "produc": [2, 11, 13, 16, 17, 98], "total": [2, 40, 84, 85, 86, 94, 95, 96, 97, 98, 99, 101, 102, 103, 104, 110], "In": [2, 6, 9, 10, 11, 12, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 85, 87, 88, 94, 95, 96, 97, 103, 104, 105, 108, 110], "openai": [2, 3, 10, 11, 18, 83, 93, 111], "gym": [2, 3, 4, 5, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 83, 84, 85, 86, 88, 89, 90, 91, 92, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 107, 108, 109, 110, 111], "v26": 2, "distinguish": [2, 17, 18], "howev": [2, 3, 4, 5, 6, 7, 10, 11, 12, 13, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 88, 94, 95, 96, 97, 101, 102, 110], "deprec": [2, 16], "favour": [2, 16], "boolean": [2, 4, 9, 13, 16, 19, 86], "valu": [2, 3, 4, 5, 6, 7, 8, 9, 11, 12, 13, 14, 16, 18, 19, 20, 70, 84, 86, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 107, 109, 110], "case": [2, 4, 5, 6, 11, 12, 14, 16, 17, 18, 19, 53, 65, 85, 94, 95, 96, 97, 103, 104, 110], "further": [2, 70, 86, 101, 102], "undefin": 2, "signal": [2, 11, 13, 16, 17, 18, 94, 96, 97, 104, 110], "mai": [2, 6, 9, 10, 12, 13, 14, 16, 17, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 94, 95, 96, 97, 103, 104, 109], "emit": [2, 11, 13], "differ": [2, 4, 5, 9, 10, 11, 12, 13, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 85, 92, 94, 95, 96, 97, 98, 99, 100, 104, 105], "reason": [2, 86, 105], "mayb": 2, "underli": [2, 11, 13, 16, 88], "solv": [2, 17, 84, 87, 89, 93, 99, 100], "successfulli": 2, "certain": [2, 43, 45, 99, 100, 102], "exceed": [2, 11, 13, 16, 94, 96, 97, 104], "simul": [2, 20, 46, 47, 48, 49, 50, 93, 97, 98, 99, 100, 105], "enter": [2, 9, 16, 27, 29, 56, 86], "invalid": [2, 6], "option": [2, 3, 4, 5, 6, 9, 10, 11, 13, 14, 16, 17, 85, 88, 89, 90, 91, 92], "int": [2, 3, 4, 5, 6, 7, 8, 9, 10, 12, 13, 14, 16, 17, 19, 20], "none": [2, 3, 4, 5, 6, 7, 8, 9, 10, 13, 14, 16, 17, 19, 109], "intern": [2, 10, 14], "new": [2, 4, 11, 12, 13, 14, 16, 17, 18, 19, 24, 27, 29, 42, 88, 89, 90, 91, 92, 102, 105], "start": [2, 4, 6, 9, 10, 13, 16, 19, 30, 43, 44, 50, 54, 55, 70, 105, 107, 108, 109, 110], "often": [2, 4, 17, 93], "some": [2, 4, 5, 6, 10, 11, 13, 14, 15, 16, 17, 19, 20, 36, 44, 62, 85, 87, 88, 93, 102, 103, 105, 110], "explor": [2, 4, 50], "generalis": 2, "polici": [2, 14, 15, 18, 19, 87, 93, 94, 95, 96, 97, 98, 103, 104, 105, 111], "control": [2, 4, 6, 15, 16, 20, 22, 25, 27, 28, 29, 30, 31, 36, 38, 41, 48, 49, 50, 53, 55, 62, 63, 65, 67, 68, 69, 70, 71, 72, 75, 76, 83, 85, 88, 89, 90, 91, 92, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104], "alreadi": [2, 11, 14, 16, 105], "rng": [2, 4, 5, 6, 17], "therefor": [2, 4, 10], "right": [2, 6, 16, 17, 20, 22, 24, 25, 26, 27, 31, 35, 36, 40, 42, 43, 44, 45, 46, 47, 48, 49, 50, 52, 53, 54, 55, 57, 59, 60, 61, 63, 66, 71, 73, 74, 76, 77, 80, 81, 84, 85, 86, 89, 90, 91, 92, 94, 95, 96, 97, 98, 99, 100, 103, 104, 108, 109, 110], "after": [2, 3, 9, 10, 13, 14, 16, 17, 18, 19, 28, 32, 37, 43, 47, 51, 73, 86, 94, 95, 96, 97, 98, 103, 104, 105, 107, 110], "never": 2, "again": [2, 17, 86], "custom": [2, 4, 9, 10, 14, 16, 20, 46, 47, 48, 49, 50, 103, 105, 109], "line": [2, 17, 43, 88], "correctli": [2, 14, 15, 17], "v0": [2, 3, 10, 11, 13, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 84, 85, 86, 88, 89, 90, 91, 92, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 107, 108, 109, 110], "25": [2, 20, 46, 47, 48, 49, 50, 94, 96, 97, 98, 104, 110], "return_info": 2, "now": [2, 16, 17, 18, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 84, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104], "expect": [2, 4, 5, 6, 10, 13], "prng": [2, 4, 5, 6], "doe": [2, 3, 5, 7, 9, 10, 11, 13, 16, 17, 18, 32, 48, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 107], "pass": [2, 3, 4, 5, 6, 7, 9, 10, 11, 12, 13, 14, 15, 16, 17, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 85, 86, 94, 95, 96, 97, 103, 104], "chosen": [2, 6, 20], "sourc": [2, 17, 93, 105], "entropi": 2, "timestamp": 2, "dev": [2, 19], "urandom": 2, "integ": [2, 5, 6, 9, 13, 14, 17, 20, 110], "even": [2, 3, 17, 19, 21, 23, 29, 30, 32, 34, 37, 38, 41, 51, 52, 53, 55, 56, 58, 62, 65, 67, 68, 69, 70, 72, 75, 79, 82, 98], "exist": [2, 3, 4, 10, 11, 16, 19], "usual": [2, 5, 6, 11, 13, 16, 17, 20, 46, 47, 48, 49, 50, 52, 96], "want": [2, 5, 10, 11, 12, 13, 15, 16, 17, 29, 51], "been": [2, 9, 13, 16, 17, 18, 94, 97, 98, 105], "refer": [2, 9, 13, 16, 17, 18], "minim": [2, 17, 18, 19], "abov": [2, 5, 6, 9, 16, 20, 46, 47, 48, 49, 50, 88, 89, 92, 93], "paradigm": 2, "specifi": [2, 4, 5, 6, 9, 11, 12, 13, 14, 15, 16, 17, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 86, 87, 92, 96, 97, 101, 102, 104, 105, 106, 109, 110], "how": [2, 4, 9, 10, 16, 17, 18, 19, 52, 54, 55, 98, 99, 101, 102, 105], "depend": [2, 5, 9, 14, 15, 20, 22, 23, 24, 25, 26, 27, 28, 31, 32, 33, 35, 36, 38, 40, 42, 43, 44, 45, 46, 47, 48, 49, 50, 54, 55, 57, 59, 60, 61, 63, 64, 66, 71, 73, 74, 76, 77, 78, 80, 81, 83, 87, 89, 93, 94, 95, 96, 97, 103, 104, 105, 109], "specif": [2, 3, 6, 13, 16, 18, 105], "analog": [2, 20], "dictionari": [2, 4, 5, 9, 10, 11, 13, 14, 16, 17, 19, 110], "complement": 2, "It": [2, 3, 5, 6, 9, 10, 11, 13, 16, 17, 20, 21, 22, 23, 24, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 51, 52, 53, 54, 55, 56, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 78, 79, 80, 81, 84, 93, 94, 95, 96, 97, 98, 101, 102, 103, 104, 105, 108], "union": [2, 3, 4, 5, 6, 7, 8, 9, 10, 12, 14], "renderfram": [2, 9], "list": [2, 4, 5, 6, 9, 10, 11, 14, 16, 19, 20, 105], "comput": [2, 9, 17, 63, 75, 94, 99, 101, 102, 105], "frame": [2, 9, 13, 14, 20, 33, 85, 86, 98, 101, 105], "render_mod": [2, 9, 10, 11, 13, 14, 16, 17, 20, 111], "wai": [2, 5, 11, 16, 18, 19, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 105], "most": [2, 4, 11, 13, 14, 16, 17, 19, 20, 46, 47, 48, 49, 50, 102], "achiev": [2, 20, 23, 88, 107], "appli": [2, 3, 5, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 19, 84, 86, 87, 88, 89, 90, 91, 92, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 107], "collect": [2, 10, 23, 26, 44, 58, 59, 62, 78, 105], "As": [2, 10, 11, 16, 76, 88, 93, 94, 95, 97, 98, 105, 106, 110], "known": [2, 13, 27, 105], "__init__": [2, 5, 8, 11, 12, 14, 15, 17, 19], "initialis": [2, 13], "By": [2, 3, 13, 16, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 88, 94, 95, 96, 97, 103, 104], "continu": [2, 4, 11, 12, 16, 18, 25, 26, 85, 86, 87, 90, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105], "current": [2, 6, 9, 11, 13, 14, 17, 20, 85, 88, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 107, 108, 109, 110], "displai": [2, 17, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 89, 105], "consumpt": 2, "occur": [2, 13, 16, 17, 19, 88, 89], "doesn": [2, 3, 11, 13, 18, 20, 86], "t": [2, 3, 5, 6, 7, 9, 11, 13, 14, 15, 17, 18, 20, 36, 46, 47, 48, 49, 50, 69, 70, 85, 86, 90, 91], "repres": [2, 5, 6, 9, 16, 17, 19, 86, 88, 91, 92, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 109, 110, 111], "np": [2, 4, 5, 6, 8, 9, 10, 12, 13, 14, 15, 16, 17, 19, 86, 110], "ndarrai": [2, 3, 5, 6, 7, 8, 9, 12, 88, 89, 90, 91, 92, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 110], "shape": [2, 4, 5, 6, 7, 8, 11, 12, 13, 14, 16, 17, 84, 85, 86, 88, 89, 90, 91, 92, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104], "x": [2, 4, 6, 7, 17, 86, 89, 90, 91, 92, 94, 95, 96, 97, 98, 99, 101, 102, 103, 104, 105], "y": [2, 6, 20, 86, 92, 94, 95, 97, 98, 99, 101, 102, 103, 110], "3": [2, 5, 6, 7, 8, 9, 10, 13, 14, 16, 17, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 84, 85, 86, 88, 89, 90, 91, 92, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 107, 108, 109, 110], "rgb": [2, 11, 13, 14, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 85, 94, 95, 96, 97, 98, 99, 100, 103, 104], "pixel": [2, 11, 17, 85, 105], "imag": [2, 4, 10, 11, 13, 14, 16, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 85, 105], "string": [2, 4, 6, 9, 14, 19], "str": [2, 3, 4, 5, 6, 7, 9, 10, 13, 14, 20, 94, 95, 96, 97, 103, 104], "stringio": [2, 106], "style": [2, 10, 13, 105], "represent": [2, 18], "each": [2, 3, 4, 5, 6, 9, 10, 11, 12, 14, 16, 17, 19, 20, 40, 42, 43, 44, 45, 48, 56, 63, 65, 66, 67, 68, 69, 70, 71, 83, 84, 86, 87, 88, 89, 90, 91, 94, 97, 98, 99, 100, 101, 105, 106, 108, 110], "includ": [2, 3, 14, 17, 18, 19, 20, 89, 94, 95, 96, 97, 99, 100, 101, 102, 103, 104, 105, 110], "newlin": 2, "escap": [2, 39, 54, 58], "sequenc": [2, 3, 4, 6, 7, 10, 14, 20, 105], "color": [2, 5, 24, 35, 48, 66], "rgb_array_list": [2, 9, 11, 13], "ansi_list": 2, "base": [2, 4, 5, 10, 11, 12, 13, 14, 15, 16, 17, 44, 53, 70, 83, 88, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 110], "except": [2, 16, 17, 67, 70], "rendercollect": [2, 11, 13], "pop": [2, 16, 102], "sure": [2, 13, 16, 17], "kei": [2, 3, 4, 5, 6, 9, 10, 11, 13, 14, 16, 17, 18, 19, 20, 21, 52, 94, 95, 96, 97, 101, 102, 103, 104, 105, 110], "support": [2, 4, 5, 7, 9, 10, 11, 13, 14, 16, 17, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 88, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105], "longer": [2, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 94, 96, 97, 98, 99, 100, 101, 102, 104, 105], "accept": [2, 9, 13, 17, 20], "rather": [2, 85, 105], "v1": [2, 3, 9, 10, 13, 14, 15, 16, 19, 84, 85, 86, 88, 89, 92, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 107, 109, 110], "type": [2, 4, 5, 6, 10, 11, 12, 14, 16, 17, 19, 42, 85, 94, 95, 96, 97, 103, 104, 105], "discret": [2, 4, 5, 7, 8, 10, 12, 14, 16, 17, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 85, 86, 88, 89, 90, 91, 105, 106, 107, 108, 109, 110], "give": [2, 23, 24, 42, 43, 86, 101, 107, 110], "2": [2, 5, 6, 7, 8, 9, 10, 12, 14, 15, 16, 17, 19, 20, 21, 22, 24, 25, 26, 27, 28, 30, 31, 33, 35, 36, 38, 40, 42, 43, 44, 45, 46, 47, 48, 49, 50, 52, 54, 57, 59, 60, 61, 63, 64, 66, 71, 73, 74, 75, 76, 77, 78, 80, 81, 86, 88, 89, 90, 91, 92, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 107, 108, 109, 110], "mean": [2, 16, 17, 19, 88, 94, 95, 96, 101], "two": [2, 5, 6, 9, 10, 13, 16, 17, 19, 20, 22, 33, 75, 84, 86, 88, 90, 91, 93, 94, 95, 96, 97, 98, 99, 101, 102, 103, 104, 107], "1": [2, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 84, 85, 86, 88, 89, 90, 91, 92, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 107, 108, 109, 110], "box": [2, 4, 5, 7, 8, 10, 11, 12, 14, 16, 17, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 84, 85, 86, 91, 92, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105], "4028234663852886e": 2, "38": [2, 97, 98], "4": [2, 6, 7, 9, 10, 11, 12, 13, 14, 16, 17, 19, 20, 22, 24, 25, 26, 27, 29, 31, 33, 35, 36, 40, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 54, 57, 59, 60, 61, 63, 64, 65, 66, 73, 74, 76, 77, 78, 80, 81, 84, 86, 88, 89, 90, 91, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 108, 109, 110], "float32": [2, 5, 6, 7, 8, 10, 11, 12, 14, 16, 19, 84, 85, 86, 91, 92, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104], "denot": [2, 89], "we": [2, 6, 13, 14, 15, 16, 17, 18, 19, 20, 94, 97, 98, 105], "check": [2, 6, 13, 17, 110], "well": [2, 4, 17, 19, 27, 70, 88, 94, 97, 98, 105], "high": [2, 5, 6, 7, 8, 10, 14, 16, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 84, 85, 86, 88, 89, 90, 91, 92, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105], "8000002e": 2, "00": 2, "4028235e": 2, "1887903e": 2, "01": [2, 15, 86, 94, 95, 98, 99, 100, 101, 102, 103], "dtype": [2, 4, 5, 6, 8, 10, 14, 16, 17, 19, 86], "low": [2, 5, 6, 7, 8, 14, 16, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 84, 85, 86, 88, 89, 90, 91, 92, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105], "ani": [2, 4, 5, 8, 9, 13, 14, 16, 17, 18, 19, 20, 42, 46, 47, 48, 49, 50, 51, 69, 86, 89, 94, 96, 97, 98, 99, 100, 101, 102, 103, 104, 109], "etc": [2, 4, 11, 16, 17, 18, 19, 65, 68, 72, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104], "determin": [2, 6, 17, 18, 20, 86, 88, 89, 90, 91, 92, 105], "inf": [2, 14, 89, 90, 91, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104], "envspec": [2, 3], "normal": [2, 6, 11, 13, 84, 85, 92, 94, 95, 99], "finish": [2, 85, 86], "code": [2, 4, 5, 9, 10, 11, 13, 14, 15, 16, 17, 19, 88, 105], "clean": 2, "up": [2, 5, 6, 10, 14, 16, 17, 20, 21, 23, 24, 25, 26, 27, 29, 30, 31, 33, 36, 39, 40, 42, 43, 44, 45, 46, 47, 48, 49, 50, 53, 54, 57, 59, 64, 66, 67, 68, 70, 71, 74, 75, 76, 77, 80, 81, 84, 86, 93, 94, 97, 98, 102, 107, 108, 109, 110], "window": [2, 9, 16, 17, 40, 85, 105], "http": [2, 9, 11, 17, 20, 85, 88, 93, 105, 107, 108], "connect": [2, 5, 88, 94, 95, 96, 102, 103, 104], "properti": [2, 4, 11, 18, 19], "unwrap": [2, 11, 16, 88], "non": [2, 4, 7, 9, 17, 18], "wrap": [2, 3, 9, 10, 11, 12, 13, 14, 15, 16, 17, 19], "_np_random": 2, "meth": 2, "much": [2, 17, 18, 20, 46, 47, 48, 49, 50, 54, 55, 98], "creat": [2, 3, 6, 8, 9, 10, 13, 16, 30, 84, 85, 86, 101, 102, 105, 106], "more": [2, 4, 5, 6, 9, 10, 11, 14, 16, 17, 18, 19, 20, 21, 24, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 41, 46, 51, 52, 53, 54, 55, 56, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 84, 86, 93, 94, 97, 98, 99, 100, 101, 102, 103, 105], "creation": [2, 10, 17], "tutori": 2, "gymnasium": [3, 4, 5, 6, 7, 8, 9, 12, 13, 14, 15, 16, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 107, 108, 109, 110], "allow": [3, 4, 5, 9, 11, 12, 14, 15, 16, 17, 20, 51, 69, 88, 89, 90, 91, 92, 99, 100, 101, 102], "load": 3, "pre": 3, "sever": [3, 6, 11, 13, 20, 50, 105], "id": [3, 10, 16, 17, 109], "kwarg": [3, 9, 10, 11, 17, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104], "env": [3, 9, 11, 12, 13, 14, 15, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 84, 85, 86, 88, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 108, 109, 110, 111], "liter": 3, "mountaincar": [3, 19, 90], "mountaincarcontinu": [3, 91], "supportsfloat": [3, 6, 11], "pendulum": [3, 10, 14, 19, 87, 88, 89, 93], "acrobot": [3, 87, 105], "lunarland": [3, 13, 16, 86, 105, 111], "v2": [3, 12, 13, 16, 84, 85, 86, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 110, 111], "lunarlandercontinu": [3, 12], "bipedalwalk": [3, 11, 12, 16, 84], "v3": [3, 11, 12, 16, 84, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 110], "bipedalwalkerhardcor": 3, "carrac": [3, 9, 14, 85], "blackjack": [3, 106], "frozenlak": [3, 9, 19, 109], "frozenlake8x8": 3, "cliffwalk": [3, 108], "taxi": [3, 106], "reacher": [3, 11, 93, 101], "v4": [3, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104], "pusher": 3, "invertedpendulum": [3, 93, 99, 100], "inverteddoublependulum": [3, 99], "halfcheetah": [3, 93, 95], "hopper": [3, 93, 104], "swimmer": [3, 93], "walker2d": [3, 93], "ant": [3, 93, 96, 104], "humanoidstandup": [3, 93, 98], "humanoid": [3, 41, 93, 94], "accord": [3, 5, 6, 10, 86], "given": [3, 6, 11, 14, 18, 19, 67, 70, 84, 86, 87, 88, 90, 91, 94, 96, 97, 104], "find": [3, 17, 20, 21, 46, 47, 48, 49, 50, 56, 65, 77, 99, 102, 105], "avail": [3, 16, 17, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 86, 105], "modul": [3, 8, 17], "eg": [3, 9, 17, 105], "max_episode_step": [3, 13, 17], "length": [3, 5, 6, 9, 11, 13, 14, 19, 84, 88, 89, 90, 91, 95, 103, 105], "autoreset": [3, 10, 17], "autoresetwrapp": [3, 11, 13, 17], "apply_api_compat": [3, 13, 16], "stepapicompat": [3, 11, 13, 16], "convert": [3, 4, 5, 11, 13, 14, 85, 105], "argument": [3, 4, 5, 6, 7, 9, 10, 14, 16, 17, 83, 87, 106], "fals": [3, 9, 10, 13, 14, 16, 17, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 85, 86, 94, 95, 96, 97, 103, 104, 107, 109], "disable_env_check": [3, 10], "checker": [3, 10], "addit": [3, 4, 10, 11, 13, 17, 20, 26, 37, 67, 71, 86, 87, 88, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 107, 110], "constructor": [3, 4, 5, 6, 9, 11, 16, 17], "rais": [3, 6, 7, 8, 9, 10, 13, 14, 19, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104], "error": [3, 6, 9, 11, 13, 18, 19], "entry_point": [3, 17], "callabl": [3, 8, 9, 10, 13, 14, 15, 19], "reward_threshold": [3, 17, 94, 95, 96, 97, 98, 101, 102, 103, 104], "nondeterminist": [3, 17], "order_enforc": [3, 17], "syntax": 3, "namespac": [3, 17, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82], "env_nam": 3, "v": [3, 6, 69, 99], "keyword": [3, 5, 10, 14, 17, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 107], "entri": 3, "point": [3, 7, 9, 11, 16, 18, 20, 23, 24, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 41, 42, 43, 44, 45, 47, 51, 52, 55, 62, 63, 64, 65, 66, 67, 68, 70, 72, 73, 74, 76, 77, 80, 84, 85, 86, 88, 89, 92, 102, 105, 107], "threshold": [3, 17, 88, 89, 110], "consid": [3, 14, 17, 85, 86, 87, 93, 94, 96, 97, 104, 105], "learnt": 3, "knowledg": 3, "limit": [3, 16, 36, 44, 51, 52, 65, 70, 99, 100], "enabl": [3, 11, 19, 20, 85, 105], "order": [3, 4, 5, 11, 16, 17, 19, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 93, 94, 95, 96, 97, 98, 99, 100, 101, 104, 105], "enforc": 3, "correct": [3, 17, 18, 110], "disabl": [3, 13], "recommend": [3, 10, 13, 17, 20, 46, 47, 48, 49, 50, 86, 94, 97, 98, 105], "onli": [3, 4, 5, 6, 7, 10, 11, 12, 13, 14, 16, 17, 19, 20, 22, 24, 25, 26, 27, 28, 31, 33, 35, 36, 40, 42, 43, 44, 45, 46, 47, 48, 49, 50, 52, 54, 57, 59, 60, 61, 63, 64, 66, 67, 68, 69, 70, 71, 73, 74, 76, 77, 78, 80, 81, 90, 91, 94, 95, 96, 97, 99, 101, 102, 104, 105], "env_id": 3, "retriev": [3, 13, 41, 44, 70], "global": 3, "superclass": [4, 12, 14, 15], "crucial": 4, "thei": [4, 10, 13, 14, 17, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 102, 106, 107], "serv": [4, 94, 95, 96, 97, 103, 104], "variou": [4, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 98, 105], "purpos": [4, 105], "clearli": 4, "interact": [4, 9, 17, 20, 105], "environ": [4, 6, 8, 11, 12, 14, 15, 18, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 106, 107, 108, 109, 110], "look": [4, 9, 11, 13, 15, 16, 17, 18, 20, 22, 24, 25, 26, 27, 28, 31, 33, 35, 36, 40, 42, 43, 44, 45, 54, 57, 59, 60, 61, 63, 64, 66, 69, 71, 73, 74, 76, 77, 78, 80, 81], "like": [4, 6, 9, 11, 12, 13, 14, 15, 16, 17, 19, 22, 23, 24, 25, 26, 27, 28, 29, 31, 33, 35, 36, 40, 42, 43, 44, 45, 54, 57, 59, 60, 61, 62, 63, 64, 65, 66, 71, 73, 74, 76, 77, 78, 80, 81, 84, 86, 94, 95, 97, 98, 100, 101, 102, 104, 105], "u": [4, 6, 11, 15, 17, 20, 105, 106], "work": [4, 9, 11, 13, 14, 20, 85, 86, 88, 95, 96, 99, 100, 104, 105], "highli": [4, 17, 20, 83, 87], "structur": [4, 5, 7, 17, 19, 105], "data": [4, 7, 9, 11, 16, 17, 19], "form": [4, 5, 6, 13, 17, 19, 88, 103], "painlessli": 4, "transform": [4, 7, 9, 11, 12, 13, 16, 102], "them": [4, 11, 13, 16, 20, 22, 23, 24, 27, 28, 32, 36, 43, 64, 73, 86, 95, 102, 105], "flat": [4, 5, 6, 7, 14], "sampl": [4, 5, 6, 7, 8, 9, 10, 14, 15, 16, 17, 19, 86, 110], "especi": [4, 15, 17, 19], "hierarch": [4, 110], "via": [4, 5, 11, 13, 14, 15, 16, 17, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 87, 93, 105, 106], "build": [4, 11, 22, 40, 44, 99, 104, 105], "express": [4, 9, 94, 97, 98], "inherit": [4, 11, 12, 14, 15, 16, 17, 19], "cover": [4, 19], "note": [4, 8, 13, 16, 18, 19, 88, 89, 94, 97, 98, 110], "parametr": 4, "probabl": [4, 18, 20, 109, 110], "distribut": [4, 5, 6, 103], "batch": [4, 8, 10, 19], "vectorenv": [4, 19], "moreov": [4, 13, 17, 19, 20, 23, 33], "implement": [4, 5, 10, 12, 13, 14, 15, 16, 17, 19, 20, 92, 99, 105, 106, 108], "handl": [4, 10, 16, 99], "care": [4, 19, 71], "immut": 4, "mask": [4, 5, 6, 19, 105, 110], "t_cov": 4, "randomli": [4, 5, 17, 86], "uniform": [4, 6, 19, 90, 91, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104], "bounded": 4, "int8": [4, 6], "member": [4, 54], "possibli": [4, 5, 6, 8, 11, 13, 16, 105], "subspac": [4, 5, 6, 7], "to_json": 4, "sample_n": 4, "jsonabl": 4, "from_json": 4, "complex": [4, 5, 97, 98, 99, 100, 105], "matric": 4, "multidiscret": [4, 5, 7, 8, 10, 16, 17, 19], "binari": [4, 6, 16, 17, 19], "hold": [4, 107], "down": [4, 6, 17, 18, 19, 20, 24, 26, 27, 33, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 53, 54, 57, 59, 61, 62, 64, 66, 74, 76, 77, 80, 81, 85, 98, 107, 108, 109], "button": [4, 6, 9], "multibinari": [4, 5, 7, 8, 16], "multipl": [4, 5, 6, 8, 10, 16, 19, 105], "ax": [4, 6, 17], "messag": [4, 105], "mission": [4, 53, 55, 56], "detail": [4, 9, 13, 16, 17, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 88, 105], "join": 4, "togeth": [4, 19, 20, 93], "vectoris": 4, "separ": [4, 5, 16, 17], "readabl": [4, 5], "fix": [4, 5, 6, 11, 13, 15, 16, 17, 53, 88, 89, 92, 93, 94, 95, 96, 97, 99, 100, 104, 109, 110], "unord": 4, "entiti": 4, "select": [4, 6, 43, 94, 97, 98, 101, 102, 105], "graph": [4, 7], "node": [4, 5, 7], "edg": [4, 5, 7, 89], "flatten": [4, 7, 11, 17, 93, 108], "unflatten": [4, 7], "neural": [4, 7, 19, 88, 103, 105], "network": [4, 7, 19, 103, 105], "flatdim": [4, 7, 19], "dimens": [4, 6, 7, 14, 19, 94, 95, 96, 97, 103, 104, 105], "flatten_spac": [4, 7], "revers": [4, 7, 107], "size": [4, 13, 17, 19, 109], "batch_spac": [4, 8], "concaten": [4, 7, 8, 93], "iter": [4, 5, 8, 10], "create_empty_arrai": [4, 8], "create_shared_memori": [4, 8], "read_from_shared_memori": [4, 8], "write_to_shared_memori": [4, 8], "spaces_kwarg": 5, "constitu": 5, "usag": [5, 6, 7, 11, 85], "ordereddict": [5, 8, 14, 16], "nest": [5, 8, 19, 105], "ext_control": 5, "5": [5, 6, 7, 8, 12, 13, 16, 17, 19, 20, 22, 24, 25, 26, 27, 30, 31, 33, 36, 40, 42, 43, 44, 45, 46, 47, 48, 49, 50, 54, 57, 59, 60, 61, 63, 64, 66, 73, 74, 76, 77, 78, 80, 81, 84, 85, 86, 88, 90, 94, 95, 96, 97, 98, 99, 101, 102, 103, 104, 105, 107, 110], "inner_st": 5, "charg": 5, "100": [5, 7, 13, 19, 34, 44, 67, 68, 84, 85, 86, 88, 91, 96, 101, 105, 108], "system_check": 5, "10": [5, 6, 12, 17, 20, 27, 33, 46, 47, 48, 49, 50, 57, 64, 67, 70, 84, 86, 92, 94, 95, 96, 97, 98, 99, 101, 102, 103, 104, 105, 107, 108, 110], "job_statu": 5, "progress": [5, 16, 76], "conveni": [5, 11, 16, 17, 19], "easili": [5, 11, 16, 105], "flattenobserv": [5, 11, 14, 17], "similar": [5, 17, 19, 24, 35, 101], "deal": 5, "instanti": [5, 9, 13, 14, 15, 17, 19, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82], "either": [5, 6, 7, 9, 13, 19, 20, 43, 53, 90, 91, 107, 109], "avoid": [5, 8, 11, 16, 19, 20, 23, 24, 26, 31, 32, 40, 42, 58, 59, 61, 66, 68, 69, 74], "independ": [5, 6, 10, 19, 96, 102, 103, 104], "same": [5, 7, 9, 10, 14, 16, 18, 19, 52, 84, 85, 88, 101, 102, 103, 110], "attr": 5, "warn": [5, 9, 10, 13, 16], "guarante": [5, 20], "uniqu": [5, 83, 87, 93, 99], "sub": [5, 10, 70], "precis": 5, "cartesian": [5, 6, 92], "product": [5, 6], "03633198": 5, "42370757": 5, "involv": [5, 17, 83, 99, 100, 105, 109], "reproduc": [5, 16], "insid": [5, 6, 13, 17, 19], "method": [5, 9, 12, 13, 14, 15, 16, 17, 19, 105, 110], "draw": [5, 17, 107], "42": [5, 6, 16, 89, 97, 98, 111], "54": 5, "finit": [5, 6, 12, 18, 94, 98, 99, 100, 101, 102, 104], "a_0": 5, "dot": [5, 6, 17, 19], "a_n": 5, "a_i": 5, "belong": [5, 8, 105], "n": [5, 6, 7, 8, 16, 19, 20, 39, 85, 88, 92, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105], "0259352": 5, "80977976": 5, "80066574": 5, "77165383": 5, "must": [5, 7, 8, 9, 10, 11, 12, 13, 14, 16, 17, 18, 19, 20, 21, 22, 25, 27, 28, 29, 30, 32, 36, 37, 38, 41, 44, 45, 54, 58, 60, 61, 66, 85, 96, 104, 105], "length_mask": 5, "sample_mask": 5, "drawn": [5, 6, 101, 103], "geometr": 5, "second": [5, 9, 10, 16, 33, 64, 71, 86, 95, 99, 102, 103, 105], "featur": [5, 6, 105], "feature_spac": 5, "node_spac": [5, 7], "edge_spac": [5, 7], "seri": [5, 16], "adjac": 5, "matrix": [5, 108], "edge_link": [5, 7], "num_nod": 5, "num_edg": 5, "graphinst": [5, 7], "between": [5, 6, 13, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 86, 88, 89, 92, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105], "don": [5, 11, 17, 18, 20, 36, 46, 47, 48, 49, 50, 70, 85, 90], "edge_mask": 5, "multipli": [5, 91], "attribut": [5, 16, 17, 101, 102], "_gener": 6, "unbound": 6, "mathbb": 6, "interv": [6, 16, 94, 96, 97, 104], "There": [6, 11, 16, 17, 52, 53, 65, 84, 85, 86, 87, 90, 91, 93, 98, 99, 100, 101, 102, 105, 107, 108, 110], "common": [6, 11, 14, 16, 18], "ident": [6, 10, 14, 19], "lower": [6, 16, 94, 95, 96, 97, 98, 101, 102, 103, 104], "upper": [6, 16, 97, 98], "construct": [6, 20, 46, 47, 48, 49, 50, 88, 94, 95, 96, 97, 103, 104], "scalar": [6, 12], "respect": [6, 10, 11, 13, 16, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 86, 88, 94, 97, 98, 103], "assum": [6, 14, 17], "across": [6, 8, 26, 36, 47, 48, 51], "infer": [6, 93], "essenti": 6, "valueerror": [6, 7, 8, 10, 13, 14, 19], "coordin": [6, 11, 14, 84, 86, 92, 94, 95, 96, 97, 98, 99, 101, 102, 103, 104, 105], "shift": [6, 16], "exponenti": [6, 11, 15], "unsupport": 6, "is_bound": 6, "manner": [6, 11, 14, 52], "both": [6, 10, 13, 14, 16, 17, 18, 84, 87, 88, 102, 104, 105, 107, 109, 110], "sens": [6, 105], "One": [6, 16, 94, 97, 98, 105], "neither": [6, 13, 107], "nor": [6, 13, 107, 108], "consist": [6, 11, 14, 16, 17, 20, 33, 84, 88, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 107], "mani": [6, 13, 14, 16, 17, 20, 26, 29, 33, 52, 55, 70, 80, 105], "subset": [6, 12, 17, 20, 46, 47, 48, 49, 50], "smallest": 6, "uniformli": [6, 17, 20, 88, 89, 101, 102], "infeas": 6, "sort": 6, "fair": 6, "coin": [6, 105], "toss": 6, "per": [6, 10, 18, 19, 33, 52, 75, 105, 110], "nvec": 6, "int64": [6, 7], "game": [6, 9, 13, 17, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 59, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 83, 107], "keyboard": [6, 9, 16], "alwai": [6, 7, 13, 17, 20, 86, 90, 91, 94, 97, 98, 101, 103, 109, 110], "noop": [6, 9, 13, 20, 22, 24, 25, 26, 27, 28, 31, 33, 35, 36, 40, 42, 43, 44, 45, 46, 47, 48, 49, 50, 54, 57, 59, 60, 61, 63, 64, 66, 71, 73, 74, 76, 77, 78, 80, 81], "nintendo": 6, "conceptu": 6, "arrow": [6, 16, 64], "left": [6, 16, 17, 20, 22, 24, 25, 26, 27, 31, 35, 36, 40, 42, 43, 44, 45, 46, 47, 48, 49, 50, 52, 53, 54, 57, 59, 60, 61, 63, 66, 70, 71, 73, 74, 76, 77, 80, 81, 84, 85, 86, 89, 90, 94, 97, 98, 99, 100, 104, 108, 109], "param": 6, "min": [6, 12, 88, 89, 90, 91, 92, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104], "max": [6, 12, 13, 88, 89, 90, 91, 92, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104], "press": [6, 9, 16, 85, 88], "although": 6, "rare": 6, "d": [6, 9, 88, 101, 102], "categor": 6, "vector": [6, 9, 11, 84, 86, 98, 99, 100, 101, 102, 109], "count": [6, 84, 86, 107], "complic": [6, 11, 16], "kind": 6, "unless": [6, 11, 17, 110], "max_length": 6, "min_length": 6, "charset": 6, "frozenset": 6, "6": [6, 7, 20, 24, 25, 26, 27, 31, 40, 42, 43, 44, 45, 46, 47, 48, 49, 50, 54, 57, 59, 61, 75, 76, 77, 80, 81, 88, 90, 91, 94, 95, 96, 97, 98, 99, 101, 102, 103, 104, 108, 110], "7": [6, 9, 19, 20, 24, 26, 27, 31, 40, 42, 43, 44, 45, 46, 47, 48, 49, 50, 54, 57, 59, 61, 76, 77, 80, 81, 94, 95, 96, 97, 98, 99, 101, 102, 103, 104], "8": [6, 9, 10, 19, 20, 22, 24, 26, 27, 29, 31, 35, 40, 42, 43, 44, 45, 46, 47, 48, 49, 50, 54, 57, 59, 60, 76, 80, 81, 85, 86, 88, 89, 92, 94, 95, 96, 97, 98, 99, 101, 102, 103, 104, 109], "9": [6, 8, 10, 19, 20, 24, 27, 32, 41, 46, 47, 48, 49, 50, 54, 57, 67, 76, 81, 88, 92, 94, 95, 96, 97, 98, 99, 101, 102, 104, 107], "c": [6, 19, 69, 86, 88, 105], "f": [6, 14, 15, 109], "h": [6, 109], "j": [6, 20], "k": [6, 7, 9, 13, 86, 103], "l": [6, 13, 103], "m": [6, 7, 17, 19, 20, 39, 88, 90, 91, 92, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104], "o": [6, 19], "p": [6, 95, 109, 110], "q": [6, 18, 66, 110], "w": [6, 9, 16, 94, 97, 98], "z": [6, 94, 95, 96, 97, 98, 101, 102, 104], "compris": 6, "charact": [6, 9, 54, 65], "b5": 6, "hello": 6, "0123456789": 6, "digit": [6, 105], "inclus": [6, 20], "prevent": [6, 10, 43, 105], "empti": [6, 8, 13, 70], "english": 6, "alphabet": 6, "plu": [6, 36, 108], "latin": 6, "charlist": 6, "zero": [6, 8, 17, 18, 19, 92, 95, 105], "matter": 6, "equival": [7, 19, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82], "would": [7, 12, 14, 15, 16, 17, 94, 95, 96, 97, 98, 103, 104], "notimplementederror": 7, "cannot": [7, 8, 13, 17, 18, 108], "attempt": [7, 19, 86, 98, 99], "compound": 7, "func": 7, "oper": [7, 13, 19], "itself": [7, 10, 11, 13, 16], "boundari": 7, "while": [7, 17, 18, 19, 20, 23, 24, 40, 55, 58, 59, 60, 61, 64, 66, 68, 70, 74, 77, 79, 86, 88, 89, 92, 94, 95, 97, 98, 101, 102, 103, 105, 107], "being": [7, 13, 16, 41, 90, 91, 92, 94, 97, 98, 102, 105, 110], "exactli": [7, 103], "origin": [7, 10, 12, 13, 14, 85, 88, 99, 101, 102, 105], "effect": [7, 8, 11, 13, 14, 16, 20, 46, 47, 48, 49, 50, 86, 99, 100, 110], "flattenend": 7, "60": [7, 54, 67, 105], "recurs": 7, "12": [7, 20, 27, 29, 33, 35, 46, 47, 48, 49, 50, 54, 57, 69, 86, 88, 89, 94, 95, 96, 97, 98, 101, 104], "hot": 7, "match": [7, 10, 12, 75], "copi": [8, 10, 17, 19, 105], "item": [8, 9, 105], "_": [8, 9, 10, 11, 16, 111], "6348213": 8, "28607962": 8, "60760117": 8, "87383074": 8, "192658": 8, "2148103": 8, "output": [8, 9, 13, 16], "99644893": 8, "08304597": 8, "7238421": 8, "35848552": 8, "1533453": 8, "67958736": 8, "49076623": 8, "38661423": 8, "7975036": 8, "93317133": 8, "stopiter": 8, "fn": 8, "built": [8, 105], "multi_binari": 8, "multi_discret": 8, "ctx": 8, "multiprocess": [8, 10, 19], "opt": 8, "hostedtoolcach": 8, "14": [8, 20, 46, 47, 48, 49, 50, 54, 84, 86, 94, 95, 97, 98, 101, 104], "x64": 8, "lib": [8, 108], "python3": 8, "process": [8, 9, 10, 14, 17, 18, 19, 88, 101], "eventu": 8, "shared_memori": [8, 10, 19], "customspaceerror": 8, "read": [8, 19, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 84, 85, 86, 88, 89, 90, 91, 92, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 107, 108, 109, 110], "forward": [8, 31, 53, 84, 94, 95, 96, 97, 98, 103, 104], "vice": [8, 13], "versa": [8, 13], "side": [8, 14, 22, 35, 50, 52, 86], "write": [8, 10, 17, 19], "num_env": [8, 10, 19], "plai": [9, 17, 30, 43, 56, 75, 80, 85, 105, 107], "transpos": [9, 17], "zoom": 9, "callback": [9, 16], "keys_to_act": [9, 16], "dw": 9, "so": [9, 10, 11, 13, 14, 16, 17, 18, 19, 20, 48, 71, 86, 87, 94, 95, 96, 97, 98, 99, 100, 103, 104, 105], "particularli": [9, 13, 19, 89], "verifi": 9, "level": [9, 20, 27, 44, 66, 74, 105], "preprocess": [9, 11], "unplay": 9, "wish": [9, 14, 16], "plot": [9, 16], "real": [9, 16, 52, 95, 105], "statist": [9, 16], "playplot": [9, 16], "here": [9, 16, 17, 88], "last": [9, 13, 16, 17, 18, 19, 42, 43, 53, 95, 98, 101, 102], "150": 9, "def": [9, 11, 12, 14, 15, 16, 17, 19], "obs_t": [9, 16], "obs_tp1": [9, 16], "rew": [9, 16, 18], "plotter": [9, 16], "execut": [9, 12, 17, 19, 20, 43, 105, 110], "render_fp": [9, 13, 17], "30": [9, 13, 16, 20, 64, 67, 97, 98], "amount": [9, 40, 42, 43, 45, 51, 70, 84, 89, 99, 100], "input": [9, 10, 16, 19], "receiv": [9, 10, 16, 18, 19, 30, 33, 37, 40, 41, 47, 53, 56, 85, 86, 91, 104], "map": [9, 14, 16, 17, 38, 109, 110], "unicod": 9, "suppos": [9, 16], "trigger": [9, 110], "key_to_act": [9, 16], "ord": [9, 16, 17], "unknown": [9, 105], "horizon_timestep": 9, "plot_nam": 9, "live": [9, 23, 26, 29, 30, 32, 35, 40, 41, 44, 51, 55, 56, 62, 68, 73], "transit": [9, 16, 18, 20, 46, 47, 48, 49, 50, 97, 98, 110], "compute_metr": 9, "obs_tp": 9, "cumulative_reward": 9, "linalg": [9, 17], "norm": [9, 17, 101, 102], "its": [9, 10, 12, 13, 35, 42, 65, 77, 82, 86, 92, 93, 103, 105], "along": [9, 11, 16, 19, 54, 55, 57, 68, 85, 89, 90, 91, 95, 99, 100, 103], "conjunct": 9, "evolv": 9, "200": [9, 45, 68, 86, 88, 89, 90, 92], "immedi": [9, 11, 15, 17, 107], "cumul": [9, 11, 13], "magnitud": [9, 86, 91, 99, 100], "your_env": 9, "len": [9, 12], "horizon": [9, 18, 70, 96, 104], "titl": [9, 90, 91], "dependencynotinstal": [9, 13], "matplotlib": 9, "playablegam": 9, "process_ev": 9, "event": [9, 17, 105], "particular": [9, 11, 14, 18, 19, 86], "keep": [9, 11, 13, 17, 28, 41, 60, 63, 71, 72, 80, 89, 98], "track": [9, 11, 13, 72, 85, 89, 94, 95, 96, 97, 98, 99, 100, 103, 104], "exit": [9, 10], "save_video": 9, "video_fold": [9, 13], "episode_trigg": [9, 13], "step_trigg": [9, 13], "video_length": [9, 13], "name_prefix": [9, 13], "rl": [9, 13, 16, 18, 111], "episode_index": 9, "step_starting_index": 9, "extract": 9, "compos": 9, "record": [9, 11, 84], "store": [9, 10, 13], "iff": [9, 13, 17], "isn": 9, "entir": [9, 13, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 96, 104, 105], "snippet": [9, 13], "captur": [9, 13, 79], "Will": [9, 13], "prepend": [9, 13], "filenam": [9, 13], "moviepi": 9, "imagesequenceclip": 9, "durat": [9, 94, 96, 97, 98, 99, 100, 101, 102, 104], "step_index": 9, "199": 9, "capped_cubic_video_schedul": 9, "episode_id": 9, "27": [9, 88, 94, 97, 98], "729": 9, "1000": [9, 13, 16, 19, 68, 70, 85, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 111], "2000": [9, 84], "3000": 9, "schedul": [9, 109], "step_api_compat": 9, "step_return": 9, "output_truncation_bool": [9, 13, 16], "is_vector_env": 9, "doc": [9, 13, 86], "ob": [9, 11, 14, 110], "interfac": [9, 105, 111], "conflict": [9, 105], "written": [9, 11, 105], "final": [9, 10, 13, 17, 18, 53], "desir": [9, 103, 104], "oldenv": 9, "vec_env": 9, "convert_to_terminated_truncated_step_api": 9, "irrespect": 9, "convert_to_done_step_api": 9, "omit": [9, 93, 94, 95, 96, 97, 98, 103, 104], "env_check": [9, 16], "check_env": [9, 16], "skip_render_check": [9, 16], "invas": [9, 74], "farama": [9, 11, 17], "org": [9, 20, 93, 105], "content": 9, "environment_cr": 9, "ignor": [9, 20, 107], "skip": [9, 13, 17, 20], "ci": 9, "parallel": [10, 19], "linear": [10, 19, 86, 88, 99, 100, 103], "speed": [10, 31, 84, 85, 105, 110], "taken": [10, 13, 17, 19, 44, 50, 87, 89, 110], "wait": [10, 18, 44, 46, 70], "until": [10, 11, 17, 43, 56, 101, 107], "overwritten": [10, 11], "final_observ": [10, 13, 19], "final_info": [10, 13], "asyncvectorenv": [10, 19], "syncvectorenv": [10, 19], "single_observation_spac": [10, 19], "single_action_spac": [10, 19], "v25": 10, "old": [10, 11, 13, 16], "vectorlistinfo": [10, 11, 13], "rememb": [10, 13, 17, 85], "share": 10, "other": [10, 11, 12, 13, 14, 17, 19, 26, 35, 38, 46, 52, 86, 92, 93, 95, 99, 101, 102, 104, 110], "word": [10, 101], "02240574": 10, "03439831": 10, "03904812": 10, "02810693": 10, "01586068": 10, "01929009": 10, "02394426": 10, "04016077": 10, "01314174": 10, "03893502": 10, "02400815": 10, "0038326": 10, "instead": [10, 14, 17, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 84, 88, 104], "00122802": [10, 19], "16228443": [10, 19], "02521779": [10, 19], "23700266": [10, 19], "00788269": [10, 19], "17490888": [10, 19], "03393489": [10, 19], "31735462": [10, 19], "04918966": [10, 19], "19421194": [10, 19], "02938497": [10, 19], "29495203": [10, 19], "releas": [10, 17, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 88, 90, 91, 92, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 107, 108, 109, 110], "resourc": [10, 17], "viewer": 10, "close_extra": 10, "synchron": 10, "asynchron": 10, "garbag": 10, "program": [10, 105], "04456399": 10, "04653909": 10, "01326909": 10, "02099827": 10, "03073904": 10, "00145001": 10, "03088818": 10, "03131252": 10, "03468829": 10, "01500225": 10, "01230312": 10, "01825218": 10, "registri": 10, "env_fn": [10, 19], "context": [10, 19], "daemon": 10, "worker": [10, 19, 64], "pipe": 10, "commun": 10, "lambda": [10, 14, 15, 19], "81": [10, 19, 92], "62": [10, 19], "8286432": 10, "5597771": 10, "90249056": 10, "85009176": 10, "5266346": 10, "60007906": 10, "back": [10, 11, 19, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 48, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 94, 95], "improv": 10, "effici": [10, 14, 90, 91, 99, 105], "larg": [10, 11, 19, 91, 94, 95, 96, 97, 98, 101, 102, 103, 104, 105], "subprocess": 10, "flag": [10, 90, 105], "turn": [10, 13, 16, 23, 24, 85, 86, 99], "quit": [10, 17], "head": [10, 95], "spawn": [10, 19, 102], "children": 10, "overrid": [10, 11], "inner": 10, "logic": [10, 17, 85], "advanc": [10, 88, 105], "degre": [10, 14, 97, 98, 99], "flexibl": [10, 105], "chanc": 10, "shoot": [10, 27, 36, 38, 43, 44, 51, 52, 61, 64, 68, 73, 74, 82], "yourself": [10, 17, 19, 44, 64, 85], "foot": [10, 95, 96, 104], "thu": [10, 20, 46, 47, 48, 49, 50, 101, 102, 105], "own": [10, 19, 35, 70], "_worker": 10, "_worker_shared_memori": 10, "runtimeerror": [10, 19], "serial": 10, "modular": [11, 12, 14, 15, 16, 17, 105], "behavior": [11, 16, 17, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 92, 94, 95, 96, 97, 98, 103, 104, 105], "modif": [11, 16, 101, 102], "without": [11, 16, 17, 42, 97, 107, 109], "alter": [11, 16, 17, 20], "lot": [11, 16], "boilerpl": [11, 16, 17], "chain": [11, 16, 88, 103], "rescaleact": [11, 12, 16], "base_env": [11, 16], "wrapped_env": [11, 12, 13, 16, 17], "min_act": [11, 12, 16], "max_act": [11, 12, 16], "access": [11, 13, 19, 51, 105], "underneath": [11, 16, 89], "anoth": [11, 18, 19, 35, 97, 98, 100, 101, 102, 104, 110], "orderenforc": [11, 13, 17], "get": [11, 16, 18, 19, 20, 40, 43, 44, 45, 52, 62, 63, 64, 65, 67, 68, 69, 74, 84, 86, 94, 96, 97, 99, 107], "layer": [11, 16, 105], "bare": 11, "just": [11, 16, 46, 52, 69, 100, 102], "box2d": [11, 16, 84, 85, 86], "bipedal_walk": [11, 16, 84], "0x7f87d70712d0": [11, 16], "three": [11, 16, 17, 20, 23, 26, 28, 41, 49, 55, 62, 67, 68, 69, 70, 94, 96, 97, 98, 103, 104], "thing": [11, 14, 16, 19, 20], "do": [11, 13, 14, 15, 16, 17, 20, 33, 45, 66, 70, 71, 85, 86, 88, 94, 95, 96, 97, 103, 104, 105], "Such": [11, 16], "actionwrapp": [11, 12, 16], "observationwrapp": [11, 14, 16, 17], "rewardwrapp": [11, 15, 16], "present": [11, 17, 18, 88, 105], "section": [11, 16, 17, 19, 20, 71, 94, 95, 96, 97, 103, 104], "found": [11, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 93], "github": [11, 17, 93, 108], "com": [11, 17, 93, 105, 108], "foundat": [11, 17], "forget": [11, 17], "commonli": [11, 16], "page": [11, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 84, 85, 86, 88, 89, 90, 91, 92, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 107, 108, 109, 110], "descript": [11, 17, 105], "ataripreprocess": [11, 13], "misc": 11, "tp": 11, "atari": [11, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82], "clipact": [11, 12, 16], "clip": [11, 15, 16, 17, 90, 91, 94, 97], "envcompat": [11, 13], "compat": [11, 14, 19, 105], "21": [11, 94, 97, 98, 101, 107], "filterobserv": [11, 14], "filter": 11, "request": [11, 107], "framestack": [11, 13], "anobserv": 11, "stack": [11, 14, 19], "roll": [11, 14, 33, 101], "grayscaleobserv": [11, 14], "grai": [11, 13], "scale": [11, 13, 15, 20, 86, 94, 95, 96, 97, 103, 104, 105], "humanrend": [11, 13], "normalizeobserv": [11, 14], "center": [11, 14, 85, 86, 89, 92, 94, 95, 97, 98, 105, 108], "unit": [11, 14, 54, 88, 90, 91, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104], "varianc": [11, 14, 15], "normalizereward": [11, 15], "averag": [11, 15, 18, 97], "pixelobservationwrapp": [11, 14], "augment": [11, 14], "obtain": [11, 13, 16, 18, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 92, 107], "ad": [11, 13, 14, 17, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 48, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 86, 91, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 110], "replac": [11, 107], "recordepisodestatist": [11, 13], "recordvideo": [11, 13], "rollout": [11, 13, 110], "save": [11, 13], "rescal": [11, 16], "resizeobserv": [11, 14], "axbxc": [11, 14], "resiz": [11, 13], "timeawareobserv": [11, 14, 16], "trajectori": [11, 14, 15, 86, 97, 98], "append": [11, 14], "transformobserv": [11, 14], "transformreward": [11, 15], "th": [11, 19], "sometim": [11, 15, 16, 17, 19], "still": [11, 20], "let": [11, 12, 15, 16, 17, 20, 35, 105], "penal": [11, 71], "energi": [11, 84, 86, 89, 105], "weight": [11, 18, 19, 94, 95, 96, 97, 101, 102, 103, 104, 105], "those": [11, 19, 22, 24, 25, 26, 27, 28, 31, 33, 35, 36, 40, 42, 43, 44, 45, 54, 57, 59, 60, 61, 63, 64, 66, 71, 73, 74, 76, 77, 78, 80, 81, 88, 93, 94, 95, 96, 97, 98, 99, 100, 104], "nevertheless": 11, "reacherrewardwrapp": 11, "reward_dist_weight": 11, "reward_ctrl_weight": 11, "reward_dist": [11, 101, 102], "reward_ctrl": [11, 101, 102], "suffici": [11, 26, 28, 30, 32, 37], "simpli": [12, 13, 14, 15, 17, 20, 108], "overwrit": [12, 14, 15], "domain": [12, 85, 88, 90, 91, 105, 110], "sai": [12, 13, 16], "discreteact": 12, "disc_to_cont": 12, "act": 12, "__name__": [12, 19], "__main__": [12, 19], "print": [12, 17], "among": [12, 14, 87, 93], "biped": [12, 83, 97, 98], "walker": [12, 83, 93, 102, 104], "affin": [12, 86], "75": [12, 94], "noop_max": 13, "frame_skip": [13, 94, 95, 96, 97, 103, 104], "screen_siz": 13, "84": [13, 94, 97, 98], "terminal_on_life_loss": 13, "grayscale_ob": 13, "grayscale_newaxi": 13, "scale_ob": 13, "2600": [13, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82], "guidelin": 13, "machado": [13, 20], "et": [13, 20], "al": [13, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82], "2018": [13, 20, 88], "revisit": [13, 20], "arcad": [13, 20, 27, 44, 46, 47, 48, 49, 50, 105], "evalu": [13, 20, 105], "protocol": [13, 20], "open": [13, 16, 17, 20, 33, 93, 105], "problem": [13, 18, 20, 86, 89, 92, 99, 100, 103, 107, 110, 111], "stage": 13, "op": 13, "pool": [13, 103], "recent": [13, 14, 15, 105], "life": [13, 26, 40, 44, 68, 72], "lost": [13, 29, 37, 56, 69, 73], "loss": [13, 107], "off": [13, 16, 37, 52, 60, 68, 85, 86, 110], "Not": 13, "squar": [13, 14, 17, 69, 101, 102, 110], "210x180": 13, "84x84": 13, "grayscal": [13, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82], "colour": [13, 85], "greyscal": 13, "255": [13, 14, 17, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 85], "No": [13, 88, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104], "frequenc": 13, "experi": [13, 94, 97, 98, 99, 100, 105], "whenev": [13, 17, 26, 29], "channel": 13, "axi": [13, 19, 90, 91, 95, 97, 98, 103], "dimension": [13, 16, 17, 24, 86, 94, 95, 96, 102, 103, 104, 105], "memori": [13, 14, 90, 91], "optim": [13, 20, 84, 86, 97, 98, 105], "benefit": 13, "opencv": 13, "caus": [13, 53], "new_ob": 13, "final_reward": 13, "final_termin": 13, "final_trunc": 13, "final_don": 13, "prior": [13, 105], "alongsid": [13, 16, 105], "previou": [13, 18, 94, 97, 98], "re": [13, 17, 19, 52, 67, 70], "old_env": 13, "legacyenv": 13, "retun": 13, "modern": [13, 105], "convers": [13, 105], "passiveenvcheck": 13, "cartpoleenv": 13, "customenv": [13, 16], "manual": [13, 16, 20, 46, 47, 48, 49, 50, 105], "unregist": [13, 19], "surround": [13, 105], "test": [13, 17, 84, 105], "haven": 13, "screen": [13, 20, 22, 26, 30, 35, 36, 38, 47, 53, 59, 69, 70, 94, 95, 96, 97, 98, 99, 100, 103, 104], "nativ": [13, 106], "nonativerend": 13, "disable_render_order_enforc": 13, "classic_control": [13, 87], "resetneed": 13, "deque_s": 13, "At": [13, 19, 29, 40, 43, 54], "_episod": 13, "elaps": 13, "sinc": [13, 16, 17, 18, 19, 20, 46, 47, 48, 49, 50, 83, 89, 93, 102, 105, 110], "begin": [13, 17, 26, 29, 42, 67, 68, 69, 70], "num": [13, 20, 22, 24, 25, 26, 27, 28, 31, 33, 35, 36, 40, 42, 43, 44, 45, 46, 47, 48, 49, 50, 54, 57, 59, 60, 61, 63, 64, 66, 71, 73, 74, 76, 77, 78, 80, 81, 88, 89, 90, 91, 92, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104], "buffer": [13, 14, 85, 105], "return_queu": 13, "length_queu": 13, "intermitt": 13, "hundredth": 13, "emploi": 13, "stop": [13, 18, 64, 74, 82, 105, 107], "span": 13, "strictli": 13, "pop_fram": 13, "reset_clean": 13, "clear": [13, 74], "issu": [13, 16, 17, 20, 94, 96, 97, 98, 104], "place": [13, 17, 24, 89, 90, 91], "part": [13, 18, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 84, 85, 86, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 107, 108, 109, 110], "\u01f9one": 13, "intend": [13, 105, 109], "around": [13, 30, 83, 102, 105], "outermost": 13, "actual": [13, 17, 110], "_k": 13, "classic": [13, 16, 18, 86, 88, 89, 90, 91, 92, 96, 100, 103, 104], "reflect": [14, 89], "2d": [14, 102, 105], "navig": [14, 16, 17, 29, 65], "agent_posit": 14, "target_posit": 14, "throw": [14, 16, 55], "awai": [14, 23, 63, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104], "freedom": [14, 97, 98, 99], "target": [14, 17, 18, 36, 88, 101, 102, 105], "rel": [14, 17, 88, 97, 98], "relativeposit": [14, 17], "ideal": 14, "subclass": 14, "accordingli": [14, 17, 70], "were": [14, 17, 37, 83, 88, 106], "incorrectli": [14, 18], "randn": [14, 19], "08319338": 14, "04635121": 14, "07394746": 14, "20877492": 14, "filter_kei": 14, "00067088": 14, "01860439": 14, "04772898": 14, "01911527": 14, "04560107": 14, "04466959": 14, "0328232": 14, "02367178": 14, "04649447": 14, "14996664": 14, "03329664": 14, "25847703": 14, "96": [14, 20, 85], "27648": 14, "num_stack": 14, "lz4_compress": 14, "lazyfram": 14, "fill": [14, 17, 29], "lz4": 14, "compress": 14, "keep_dim": 14, "uint8": [14, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82], "singleton": 14, "axbx1": 14, "axb": 14, "epsilon": [14, 15, 105], "1e": [14, 15, 97, 103, 104], "08": [14, 15], "past": [14, 15], "newli": [14, 15], "stabil": [14, 15, 97, 98], "pixels_onli": 14, "render_kwarg": 14, "pixel_kei": 14, "choos": [14, 17, 19], "odict_kei": 14, "400": [14, 110], "600": [14, 105], "discard": 14, "assertionerror": 14, "show": [14, 20, 30, 36, 107], "typeerror": 14, "unexpect": 14, "64": [14, 20], "03810719": 14, "03522411": 14, "02231044": 14, "01088205": 14, "03881167": 14, "16021058": 14, "0220928": 14, "28875574": 14, "becaus": [15, 16, 17, 19], "intrins": 15, "gain": [15, 30, 66, 72, 73, 76], "numer": [15, 98, 99, 100, 107], "clipreward": 15, "min_reward": 15, "max_reward": 15, "invari": 15, "incorrect": [15, 18], "gamma": [15, 18], "99": 15, "discount": [15, 18], "factor": 15, "veri": [16, 17, 86, 101, 105], "easi": [16, 56, 105, 106], "loop": [16, 19, 105], "torqu": [16, 84, 88, 92, 94, 95, 96, 97, 98, 101, 102, 103, 104], "motor": [16, 84, 103], "exchang": 16, "manipul": [16, 105], "robot": [16, 18, 32, 82, 84, 90, 91, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104], "succe": 16, "toward": [16, 28, 52, 103], "did": [16, 18], "yet": 16, "train": [16, 110], "maxim": 16, "accumul": [16, 42], "crash": [16, 86], "succeed": 16, "onward": [16, 18], "earlier": [16, 17], "someth": 16, "similarli": [16, 19, 86], "previous": [16, 20, 29], "core": [16, 105], "inher": [16, 18], "failur": [16, 18], "explain": 16, "retain": 16, "toggl": 16, "explicitli": [16, 17, 18], "saniti": 16, "util": [16, 17, 19], "seem": 16, "mistak": 16, "best": [16, 20, 46, 47, 48, 49, 50, 105], "practic": [16, 18, 20, 46, 47, 48, 49, 50, 105], "reus": 16, "our": [16, 17, 105], "simpl": [16, 18, 84, 106, 108, 111], "6952509": 16, "4399011": 16, "7981693": 16, "li": [16, 105], "lie": 16, "markov": [16, 18], "aspect": [16, 18], "pong": [16, 20, 35, 39], "k_left": 16, "k_right": 16, "constant": [16, 31, 70, 86, 91, 94, 96, 97, 104], "furthermor": 16, "gameplai": 16, "document": [17, 19, 20, 21, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 87, 94, 97, 98, 99, 106], "overview": 17, "relev": 17, "design": [17, 53, 88, 94, 97, 98, 106, 110], "clone": [17, 105], "virtual": [17, 105], "git": 17, "venv": 17, "bin": 17, "activ": [17, 69], "concern": 17, "readm": 17, "setup": 17, "gym_exampl": 17, "grid_world": 17, "relative_posit": 17, "reacher_weighted_reward": 17, "discrete_act": 17, "clip_reward": 17, "illustr": [17, 18], "simplist": 17, "gridworldenv": 17, "grid": [17, 24, 105, 110], "vertic": [17, 26, 84, 99, 100, 105], "horizont": [17, 26, 36, 84, 86, 88], "cell": [17, 105, 108], "locat": [17, 20, 56, 105, 110], "movement": [17, 98], "soon": [17, 110], "spars": [17, 88, 105], "blue": [17, 48, 50, 75, 88], "red": [17, 44, 50], "piec": 17, "abstract": 17, "shouldn": 17, "framer": [17, 20, 98, 101, 102], "window_s": 17, "512": 17, "encod": [17, 108, 110], "direct": [17, 68, 70, 88, 89, 90, 91, 94, 96, 97, 99, 100, 104, 105, 109], "walk": [17, 97, 104, 106, 109], "_action_to_direct": 17, "assert": 17, "clock": 17, "remain": [17, 18, 51, 54, 55, 70, 94, 108], "privat": [17, 39, 65], "_get_ob": 17, "translat": [17, 94, 97, 98], "mandatori": 17, "_agent_loc": 17, "_target_loc": 17, "manhattan": 17, "distanc": [17, 28, 45, 95], "_get_info": 17, "oftentim": 17, "determinist": [17, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 88, 90, 91, 108, 110], "worri": 17, "coincid": 17, "array_equ": 17, "_render_fram": 17, "trivial": 17, "gather": [17, 44, 65], "leav": [17, 29, 89, 93, 99], "els": [17, 96, 104, 109], "approach": [17, 99], "skeleton": 17, "init": [17, 85], "set_mod": 17, "canva": 17, "surfac": [17, 46, 70, 99, 100], "pix_square_s": 17, "rect": 17, "circl": [17, 25], "gridlin": 17, "width": 17, "visibl": 17, "blit": 17, "get_rect": 17, "pump": 17, "predefin": [17, 105], "delai": 17, "stabl": 17, "tick": 17, "surfarrai": 17, "pixels3d": 17, "bother": 17, "detect": 17, "put": 17, "registr": 17, "300": [17, 33, 45, 84], "compon": 17, "appropri": [17, 19], "apart": [17, 44], "entrypoint": 17, "mere": 17, "extra": [17, 24, 29, 30, 32, 36, 38, 51, 70, 105], "third": 17, "parti": 17, "codebas": 17, "librari": [17, 105, 106, 111], "edit": 17, "configur": [17, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 87, 93, 105, 106], "setuptool": 17, "install_requir": 17, "local": 17, "perfectli": 17, "fine": 17, "variant": [17, 85], "instruct": [17, 93], "touch": [17, 32, 65], "top": [17, 20, 35, 40, 47, 53, 55, 69, 85, 86, 87, 90, 91, 96, 99, 100, 104], "big": [17, 25, 46], "advantag": [17, 94, 105], "job": [17, 28], "definit": [18, 94, 96, 97], "success": [18, 43, 88, 110], "fall": [18, 40, 42, 62, 68, 84, 97, 109], "notabl": 18, "preserv": 18, "decis": [18, 105], "infinit": [18, 86, 96, 104, 107], "obviou": 18, "forev": 18, "forcibli": 18, "halt": 18, "idea": 18, "estim": [18, 94], "tell": 18, "abl": [18, 70], "formal": 18, "q_": 18, "o_t": 18, "a_t": 18, "r_t": 18, "max_a": 18, "o_": 18, "a_": 18, "q_target": 18, "deep": [18, 105], "distinct": 18, "becom": [18, 69, 83, 105], "frequent": 18, "differenti": 18, "shown": [18, 55, 85, 88], "vf_target": 18, "vf_next_stat": 18, "happen": [18, 69, 90, 91, 94, 96, 97, 98, 99, 100, 101, 102, 104], "suppli": [18, 36, 60], "sequenti": 19, "regist": [19, 20], "meant": 19, "basic": 19, "These": [19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 93, 94, 97, 103, 105, 106], "graviti": [19, 86, 89, 90, 92, 99, 100, 105], "exact": [19, 20, 33, 46, 47, 48, 49, 50, 107], "forkserv": 19, "standard": [19, 52, 94, 95, 99, 105], "02792548": 19, "04423395": 19, "00026012": 19, "04486719": 19, "04906582": 19, "02779809": 19, "02881928": 19, "04467649": 19, "0036706": 19, "00324916": 19, "047668": 19, "02039891": 19, "00187507": 19, "18986781": 19, "03168437": 19, "301252": 19, "02643229": 19, "18816885": 19, "04371385": 19, "3034975": 19, "02803041": 19, "24251814": 19, "02660446": 19, "29707024": 19, "regardless": [19, 94, 95, 96, 97, 103, 104], "arbitrarili": 19, "thereof": 19, "dictenv": 19, "fire": [19, 20, 22, 24, 25, 27, 28, 31, 33, 35, 36, 46, 47, 48, 49, 50, 53, 60, 61, 63, 64, 66, 67, 69, 70, 73, 74, 76, 78, 80, 81, 86], "jump": [19, 53, 68, 71], "acceler": [19, 85, 90, 91, 92], "5337036": 19, "7439302": 19, "41748118": 19, "9373266": 19, "5780453": 19, "8987405": 19, "917269": 19, "5888639": 19, "812942": 19, "23626241": 19, "0616814": 19, "4057572": 19, "4875375": 19, "26341468": 19, "72282314": 19, "3rd": 19, "fell": 19, "hole": [19, 62, 109], "is_slipperi": [19, 109], "prob": 19, "_prob": 19, "pair": [19, 97, 98], "_kei": 19, "logical_or": 19, "11350546": 19, "8090094": 19, "23710881": 19, "8017728": 19, "_final_observ": 19, "equal": [19, 90, 91, 99, 107, 109], "handi": 19, "thank": 19, "whole": 19, "scipi": 19, "special": [19, 23, 53], "softmax": [19, 105], "logit": 19, "argmax": [19, 110], "sent": 19, "expens": 19, "transfer": [19, 105], "cost": [19, 84, 95, 96, 103, 104, 105], "increas": [19, 42, 70, 86, 88, 89, 96, 103, 104], "throughput": 19, "breakoutnoframeskip": 19, "timeit": 19, "23": [19, 94, 97, 98, 101, 105], "136": 19, "\u00b5": 19, "std": 19, "36": [19, 20, 35, 97, 98], "15": [19, 20, 43, 46, 47, 48, 49, 50, 54, 73, 86, 94, 95, 97, 98, 101, 104, 105, 109], "plan": [19, 105], "try": [19, 22, 23, 24, 33, 35, 40, 63, 64], "errorenv": 19, "shut": 19, "raw": 19, "smilesenv": 19, "whose": [19, 105, 107], "smile": 19, "notat": 19, "molecular": 19, "symbol": [19, 105], "__eq__": 19, "co": [19, 88, 90, 91, 92, 99, 102, 105], "_state": 19, "pickleabl": 19, "stella": 20, "adventur": [20, 39], "air": [20, 39], "raid": [20, 39], "alien": [20, 39, 41, 61, 74], "amidar": [20, 28, 39], "assault": [20, 39], "asterix": [20, 39], "asteroid": [20, 39], "atlanti": [20, 39], "bank": [20, 39, 67], "heist": [20, 39], "licens": [20, 105], "download": [20, 105], "agre": 20, "todo": 20, "legal": [20, 46, 47, 48, 49, 50], "upright": [20, 26, 27, 31, 40, 42, 43, 44, 45, 46, 47, 48, 49, 50, 54, 59, 89, 92, 99, 100], "upleft": [20, 26, 27, 31, 40, 42, 43, 44, 45, 46, 47, 48, 49, 50, 54, 59], "downright": [20, 26, 40, 42, 43, 44, 45, 46, 47, 48, 49, 50, 54, 57, 59], "downleft": [20, 26, 40, 42, 43, 44, 45, 46, 47, 48, 49, 50, 54, 57, 59], "upfir": [20, 24, 27, 33, 46, 47, 48, 49, 50, 64, 76, 77, 78, 80, 81], "11": [20, 27, 46, 47, 48, 49, 50, 54, 57, 94, 95, 96, 97, 98, 99, 101, 102, 104, 107, 108], "rightfir": [20, 22, 24, 25, 27, 28, 31, 36, 46, 47, 48, 49, 50, 54, 57, 60, 61, 63, 73, 76, 77, 80, 81], "leftfir": [20, 22, 24, 25, 27, 28, 36, 46, 47, 48, 49, 50, 54, 57, 60, 61, 63, 73, 76, 77, 80, 81], "13": [20, 27, 46, 47, 48, 49, 50, 54, 57, 94, 95, 97, 98, 101, 104], "downfir": [20, 24, 27, 33, 46, 47, 48, 49, 50, 54, 57, 61, 64, 76, 78, 81], "uprightfir": [20, 27, 46, 47, 48, 49, 50, 54, 57], "upleftfir": [20, 27, 46, 47, 48, 49, 50, 54, 57], "16": [20, 29, 32, 35, 41, 46, 47, 48, 49, 50, 54, 92, 94, 95, 97, 98, 101, 104, 105, 109], "downrightfir": [20, 46, 47, 48, 49, 50, 54, 57], "17": [20, 32, 46, 47, 48, 49, 50, 54, 94, 95, 97, 98, 101, 104, 107], "downleftfir": [20, 46, 47, 48, 49, 50, 54, 57], "smaller": [20, 25, 27, 46, 47, 48, 49, 50], "enumer": [20, 46, 47, 48, 49, 50], "expand": [20, 46, 47, 48, 49, 50], "full": [20, 46, 47, 48, 49, 50, 85, 86], "full_action_spac": [20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82], "reduc": [20, 22, 24, 25, 26, 27, 28, 31, 33, 35, 36, 40, 42, 43, 44, 45, 46, 47, 48, 49, 50, 54, 57, 59, 60, 61, 63, 64, 66, 71, 73, 74, 76, 77, 78, 80, 81, 89], "difficulti": [20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 105], "choic": 20, "player": [20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 107], "128": [20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82], "byte": [20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82], "ram": [20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82], "consol": [20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82], "atariag": [20, 21, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 75, 77, 78, 79, 80, 81, 82], "art": 20, "memor": 20, "sticki": [20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82], "small": [20, 50, 69, 84, 105, 106], "On": [20, 61, 88, 89, 90, 91, 92], "repeat": [20, 101], "frameskip": [20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82], "exclus": 20, "tabl": [20, 23, 24, 26, 40, 42, 97, 98, 101], "obs_typ": 20, "Its": 20, "repeat_action_prob": [20, 46, 47, 48, 49, 50], "stick": [20, 29, 51, 107], "ll": [20, 53, 70], "sound": [20, 105], "lock": 20, "emul": 20, "proper": 20, "audio": 20, "v5": [20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82], "outlin": [20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 107], "variat": 20, "amidardeterminist": 20, "amidarnoframeskip": 20, "ramdeterminist": 20, "ramnoframeskip": 20, "suffix": [20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82], "noframeskip": [20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82], "airraid": [20, 22], "31": [20, 27, 97, 98], "bankheist": [20, 29], "20": [20, 29, 35, 62, 70, 86, 94, 97, 98, 101, 105, 110], "24": [20, 29, 35, 60, 84, 85, 86, 89, 94, 97, 98], "28": [20, 29, 35, 88, 97, 98], "battlezon": [20, 30], "beamrid": [20, 31], "berzerk": [20, 39], "18": [20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 94, 95, 97, 98, 101, 104], "bowl": [20, 39], "breakout": [20, 39], "32": [20, 35, 52, 97, 98, 107], "40": [20, 35, 60, 97, 98], "44": [20, 35, 97, 98], "carniv": [20, 39], "centiped": [20, 39], "22": [20, 37, 94, 97, 98, 101], "86": [20, 37], "choppercommand": [20, 38], "crazyclimb": [20, 40], "defend": [20, 28, 39, 44, 60, 72], "demonattack": [20, 42], "doubledunk": [20, 43], "elevatoract": [20, 44], "enduro": [20, 39], "fishingderbi": 20, "freewai": [20, 39], "frostbit": [20, 39], "gopher": [20, 39], "gravitar": [20, 39], "hero": [20, 39], "icehockei": 20, "jamesbond": [20, 39], "journeyescap": 20, "kangaroo": [20, 39], "krull": [20, 39], "kungfumast": [20, 57], "montezumareveng": [20, 58], "mspacman": [20, 59], "namethisgam": [20, 60], "phoenix": [20, 39], "pitfal": [20, 39, 84], "pooyan": [20, 39], "50": [20, 54, 64, 70, 86, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104], "70": [20, 64], "privateey": 20, "qbert": [20, 39], "riverraid": [20, 39], "roadrunn": [20, 68], "robotank": [20, 39, 69], "seaquest": [20, 39], "ski": [20, 39], "solari": [20, 39], "spaceinvad": 20, "stargunn": 20, "tenni": [20, 39], "timepilot": 20, "tutankham": [20, 39], "upndown": [20, 78], "ventur": [20, 39], "videopinbal": [20, 80, 81], "wizardofwor": [20, 81], "yarsreveng": 20, "zaxxon": [20, 39], "oppos": 20, "ai": 20, "mg": 20, "bellemar": 20, "naddaf": 20, "veness": 20, "platform": [20, 105], "journal": 20, "artifici": 20, "intellig": 20, "research": [20, 93, 99, 105], "2012": 20, "url": 20, "jair": 20, "php": 20, "articl": [20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82], "view": [20, 50, 105], "11182": 20, "250": [21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82], "160": [21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82], "enchant": [21, 37], "chalic": 21, "golden": 21, "castl": 21, "pick": [21, 44, 55, 68, 110], "sword": 21, "bridg": [21, 67, 105], "magnet": 21, "fight": [21, 34, 57, 60, 105], "outmanoeuvr": 21, "dragon": 21, "flavor": [21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82], "switch": [21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 105], "thorough": [21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82], "discuss": [21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82], "intric": [21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82], "stochast": [21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 87, 88, 90, 91, 93, 94, 95, 96, 97, 98, 99, 100, 102, 103, 104, 105, 110], "ship": [22, 23, 25, 31, 41, 50, 72], "sidewai": [22, 25, 31, 67, 71], "protect": [22, 28, 37, 38, 49, 54, 64], "fly": [22, 27, 51, 67, 86], "saucer": [22, 27, 74], "drop": [22, 29, 110], "bomb": [22, 41, 53, 61, 74], "meaning": [22, 24, 25, 26, 27, 28, 31, 33, 35, 36, 40, 42, 43, 44, 45, 54, 57, 59, 60, 61, 63, 64, 66, 71, 73, 74, 76, 77, 78, 80, 81], "210": [23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 37, 38, 41, 42, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82], "stuck": [23, 32, 51], "maze": [23, 24, 29, 32, 58, 77], "destroi": [23, 25, 27, 28, 29, 30, 31, 32, 35, 36, 37, 38, 41, 42, 50, 56, 67, 68, 69, 72, 73, 74, 76, 86], "egg": 23, "scatter": [23, 65], "simultan": [23, 24], "kill": [23, 32, 51, 56], "flamethrow": 23, "tricki": 23, "situat": [23, 110], "occasion": [23, 27], "power": [23, 51, 85, 86, 91, 99, 100, 105], "pulsar": 23, "temporari": 23, "abil": 23, "score": [23, 24, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 51, 52, 53, 54, 55, 56, 62, 63, 64, 65, 66, 67, 68, 70, 74, 75, 76, 80, 84, 86], "prize": [23, 78], "caught": [23, 29], "lose": [23, 26, 28, 37, 40, 41, 44, 51, 53, 62, 63, 65, 67, 68, 70, 71, 72, 86, 107], "consult": [23, 52, 53, 54, 55, 56], "pac": 24, "man": 24, "visit": [24, 44, 85], "enemi": [24, 25, 28, 30, 31, 32, 38, 41, 42, 44, 57, 66, 67, 69, 70, 72, 73, 74, 76, 82], "chicken": [24, 36, 47], "catch": [24, 40, 46, 68], "travers": 24, "vehicl": [25, 30, 45, 54, 105], "mother": [25, 55, 64], "overhead": [25, 86], "deploi": 25, "drone": 25, "dodg": [25, 31, 70], "attack": [25, 27, 28, 31, 39, 41, 64], "lyre": 26, "guid": [26, 47, 105], "award": [26, 32, 37, 40, 44, 70, 99, 100], "spaceship": [27, 41, 72], "field": [27, 105], "break": [27, 35, 85], "appear": [27, 29, 32, 69, 90, 91], "satellit": 27, "ufo": 27, "submerg": 28, "citi": [28, 29, 65, 105], "slowli": 28, "descend": 28, "strike": [28, 33], "defens": [28, 43], "post": 28, "manag": [28, 33], "seven": 28, "fought": 28, "wave": [28, 38, 42, 54, 61, 74], "outer": [28, 88], "robber": 29, "natur": [29, 107, 109], "rob": 29, "getawai": 29, "car": [29, 45, 83, 87, 105], "polic": 29, "chase": [29, 32], "dynamit": [29, 51], "ga": [29, 85], "tank": [29, 30, 70], "four": [29, 40, 85, 86, 94, 96, 104, 110], "nine": [29, 94], "person": [30, 88, 105], "perspect": [30, 105], "3d": [30, 94, 97, 98, 105], "illus": 30, "radar": [30, 81], "travel": 31, "steer": [31, 78, 85], "debri": 31, "leftifir": 31, "evil": [32, 57, 82], "wall": [32, 35, 51, 90, 91], "undefeat": 32, "otto": 32, "tri": 33, "knock": [33, 34], "pin": 33, "spar": 33, "spare": 33, "oppon": [34, 46, 52, 63, 78], "ring": 34, "hit": [34, 35, 36, 37, 42, 64, 65, 68, 69, 71, 107], "land": [34, 68, 86], "punch": [34, 55], "famou": 35, "paddl": [35, 63], "ball": [35, 52, 63, 80], "brick": 35, "wreak": 35, "havoc": 35, "five": [35, 65, 71, 87], "214": 36, "em": 36, "gun": [36, 44], "ammunit": 36, "steal": [36, 46], "bullet": [36, 105], "subtract": 36, "minu": 36, "sign": [36, 99, 100], "elf": 37, "magic": 37, "wand": 37, "fend": 37, "spider": 37, "flea": 37, "mushroom": 37, "forest": 37, "bitten": 37, "tempor": 37, "paralyz": 37, "scorpion": 37, "round": 37, "helicopt": [38, 40, 67], "truck": [38, 68], "convoi": 38, "aircraft": [38, 76], "mini": 38, "bottom": [38, 53, 85, 90, 91, 96, 104, 108], "plane": 38, "surviv": [38, 42], "battl": 39, "zone": 39, "beam": [39, 51], "rider": 39, "chopper": 39, "command": [39, 93], "crazi": 39, "climber": 39, "demon": 39, "doubl": [39, 93], "dunk": 39, "elev": 39, "fish": 39, "derbi": 39, "ic": [39, 42, 48, 52], "hockei": [39, 52], "journei": [39, 54], "kung": 39, "fu": 39, "master": [39, 93, 108], "montezuma": 39, "reveng": 39, "pacman": 39, "ey": [39, 60, 65, 105], "road": [39, 85], "runner": 39, "invad": [39, 73], "star": 39, "gunner": 39, "pilot": [39, 61, 82], "pinbal": 39, "wizard": [39, 57], "Of": 39, "wor": 39, "yar": 39, "builid": 40, "obstacl": [40, 54, 55], "damag": [40, 69], "climb": [40, 55, 87, 105], "fast": [40, 85, 93, 95, 97, 99, 103, 105], "least": [40, 75, 86], "row": [40, 73, 108, 109], "earth": [41, 73], "rescu": [41, 51, 55, 56, 57, 70, 72], "smart": 41, "shot": [41, 43, 44, 52, 53, 68, 105], "abduct": 41, "unlimit": 41, "laser": [41, 51, 73, 81], "missil": [41, 67], "aliv": [41, 97, 104], "face": [42, 94, 97, 98, 107], "planet": [42, 50, 72], "krybor": 42, "reserv": [42, 67, 69, 70], "bunker": [42, 50], "grant": [42, 86], "slai": 42, "2v2": 43, "basketbal": 43, "possess": 43, "rival": 43, "team": 43, "rule": [43, 75, 105, 107], "foul": 43, "secret": [44, 65], "ground": [44, 64, 84, 86, 94, 98, 105], "stair": 44, "equip": 44, "against": [44, 63, 75, 105], "floor": 44, "mark": 44, "door": [44, 105], "unreleas": 44, "prototyp": 44, "500": [44, 67, 88, 89, 110], "racer": 45, "nation": 45, "long": [45, 80, 89, 99, 100], "endur": 45, "race": [45, 68, 71, 83], "overtak": 45, "dai": [45, 83], "stai": 45, "meet": 45, "quota": 45, "sunfish": 46, "than": [46, 52, 70, 86, 88, 89, 90, 91, 95, 99, 100, 101, 103, 105, 107], "But": [46, 71], "fisherman": 46, "black": [46, 56, 88], "shark": [46, 60, 70], "lurk": [46, 66], "lane": [47, 105], "busi": 47, "rush": 47, "hour": 47, "traffic": 47, "cross": [47, 109], "bailei": 48, "who": [48, 49, 54, 55, 71], "hop": [48, 66, 96, 104], "forth": 48, "arctic": 48, "river": [48, 67], "block": [48, 105], "white": 48, "he": [48, 50], "hi": [48, 50, 65], "igloo": 48, "shovel": 49, "wield": 49, "farmer": 49, "crop": 49, "carrot": 49, "spacecraft": 50, "fiction": 50, "solar": 50, "system": [50, 88, 92, 99, 100, 105], "landscap": 50, "miner": 51, "mine": [51, 68], "shaft": 51, "tool": [51, 58], "propel": 51, "backpack": 51, "wherev": 51, "blast": [51, 70, 72], "vermin": 51, "raft": 51, "stretch": 51, "critter": 51, "minut": [52, 62], "period": [52, 96, 104], "puck": 52, "angl": [52, 53, 84, 86, 88, 89, 92, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104], "extrem": [52, 105, 106], "aim": [52, 96, 99, 103, 104], "rink": 52, "realli": 52, "mr": 53, "bond": 53, "multipurpos": 53, "craft": [53, 86], "varieti": [53, 105], "motion": [53, 105], "slightli": [53, 84, 94], "dive": 53, "lob": 53, "rate": [53, 70], "highest": [53, 105], "novic": 53, "006": 53, "007": 53, "lead": 54, "peski": 54, "backstag": 54, "scarab": 54, "000": [54, 67, 70], "concert": 54, "cash": 54, "grasp": 54, "groupi": 54, "photograph": 54, "promot": 54, "encount": [54, 55, 76, 105], "her": [55, 64], "preciou": 55, "babi": 55, "ladder": [55, 84], "bonu": [55, 69, 70, 74, 104], "fruit": 55, "monkei": 55, "corner": 55, "beast": 56, "fortress": [56, 58], "princess": [56, 57], "lyssa": 56, "sunris": 56, "monster": [56, 79], "templ": 57, "victoria": 57, "defeat": [57, 66], "acquir": [58, 93], "treasur": [58, 60, 62, 77, 79], "chamber": [58, 79], "emperor": 58, "deadli": 58, "creatur": [58, 66, 74, 105], "valuabl": 58, "pellet": 59, "ghost": 59, "discov": 60, "octopu": 60, "oxygen": [60, 70], "elimin": [61, 77, 78, 79], "war": 61, "bird": 61, "harri": 62, "jungl": 62, "die": [62, 64, 85], "misfortun": 62, "compet": 63, "deflect": 63, "pig": 64, "piglet": 64, "wolv": 64, "rope": 64, "balloon": 64, "guard": 64, "safe": [64, 86], "eat": [64, 68], "bait": 64, "wolf": 64, "stone": 64, "rock": [64, 68], "french": 65, "pierr": 65, "street": 65, "park": 65, "passag": 65, "dead": 65, "search": [65, 105], "ringlead": 65, "henri": 65, "le": 65, "fiend": 65, "gang": 65, "evid": 65, "stolen": 65, "good": 65, "statut": 65, "expir": 65, "nab": 65, "question": [65, 105], "auto": 65, "pothol": 65, "bert": 66, "cube": 66, "pyramid": 66, "destin": [66, 110], "nasti": 66, "jet": 67, "fli": 67, "fuel": [67, 72, 86], "depot": 67, "collid": [67, 70, 86], "squadron": [67, 69], "tanker": 67, "80": 67, "tm": 68, "outrun": 68, "wile": 68, "coyot": 68, "hazard": 68, "desert": 68, "rocket": [68, 69, 86], "cannon": [68, 73], "cliff": [68, 106], "steel": 68, "pile": 68, "birdse": 68, "cannonbal": 68, "scrambl": 69, "static": 69, "interfer": 69, "sensor": [69, 85], "report": [69, 84, 94, 97, 98], "flash": 69, "panel": 69, "earn": 69, "twelv": 69, "torpedo": 70, "diver": 70, "killer": 70, "deliv": [70, 110], "six": [70, 104], "explod": 70, "anyth": 70, "decreas": [70, 86], "almost": 70, "yoursub": 70, "blow": 70, "forc": [70, 72, 86, 89, 90, 91, 94, 97, 98, 99, 100], "less": [70, 84, 86, 99, 103], "worth": [70, 73], "90": 70, "moment": 70, "skier": 71, "gate": [71, 105], "fastest": 71, "miss": [71, 88, 110], "tree": [71, 93], "slalom": 71, "penalti": 71, "warp": 72, "sector": 72, "feder": [72, 105], "zylon": 72, "refuel": 72, "cadet": 72, "corridor": 72, "mania": [74, 76], "orang": 75, "win": [75, 107], "margin": 75, "ti": 75, "sport": 75, "till": 75, "technologi": 76, "increasingli": 76, "futur": 76, "difficult": [76, 89, 93, 99, 100], "rack": 77, "tomb": 77, "guardian": 77, "baja": 78, "bugger": 78, "dungeon": 79, "beat": [81, 107], "scanner": 81, "armi": 82, "enslav": 82, "galaxi": 82, "fighter": 82, "lunar": 83, "lander": 83, "toi": [83, 105, 107, 108, 109, 110], "contribut": 83, "earli": [83, 105], "oleg": [83, 84, 85, 86], "klimov": [83, 84, 85, 86], "popular": [83, 105], "benchmark": [83, 105], "ever": 83, "joint": [84, 86, 88, 89, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104], "uneven": 84, "terrain": [84, 105], "hardcor": 84, "stump": 84, "1600": 84, "heurist": [84, 86], "demonstr": 84, "hip": [84, 94, 97, 98], "knee": [84, 97, 98], "hull": 84, "angular": [84, 86, 88, 89, 92, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104], "leg": [84, 86, 94, 96, 97, 98, 104, 105], "contact": [84, 86, 93, 94, 97, 98, 99], "lidar": [84, 105], "rangefind": 84, "measur": [84, 92, 94, 95, 96, 97, 98, 99, 101, 102, 103, 104, 105], "far": [84, 85, 99, 101, 102, 105], "better": 84, "stand": [84, 93, 94, 97, 98, 99, 100], "slight": 84, "exce": [84, 107], "closest": 84, "trace": 84, "furthest": 84, "faster": [84, 86, 98], "spent": [84, 86], "higher": 84, "friction": [84, 103, 105], "nervous": 84, "easiest": 85, "ab": [85, 105], "wheel": 85, "gyroscop": 85, "car_rac": 85, "rear": 85, "drive": [85, 110], "noth": [85, 86], "brake": 85, "96x96": 85, "tile": 85, "732": 85, "926": 85, "rest": [85, 86, 96, 104], "playfield": 85, "lap_complete_perc": 85, "dictat": [85, 86], "percentag": 85, "lap": 85, "domain_random": 85, "scenario": [85, 105], "background": 85, "demand": 85, "correspondingli": 85, "scheme": [85, 105], "chri": 85, "campbel": 85, "2014": 85, "www": 85, "iforce2d": 85, "net": [85, 107], "b2dtut": 85, "pontryagin": 86, "principl": 86, "engin": [86, 93], "throttl": 86, "why": 86, "pad": 86, "lunar_land": 86, "orient": [86, 94, 97, 98], "sum": [86, 94, 95, 96, 97, 98, 101, 102, 103, 104, 105, 107], "closer": [86, 107], "slower": 86, "tilt": 86, "03": 86, "solut": 86, "viewport": 86, "mass": [86, 94, 95, 97, 98, 103, 105], "bodi": [86, 93, 94, 95, 96, 97, 98, 99, 100, 103, 104], "moon": 86, "greater": [86, 88, 89, 90, 91, 95, 100, 101, 103, 107], "awak": 86, "group": 86, "come": [86, 94, 95, 96, 97, 98, 99, 100, 103, 104, 105], "sleep": 86, "littl": [86, 98], "cpu": 86, "wake": 86, "attach": [86, 89, 92, 94, 104], "enable_wind": 86, "wind_pow": 86, "turbulence_pow": 86, "later": 86, "booster": 86, "gravit": 86, "wind": 86, "tanh": 86, "sin": [86, 92, 99], "pi": [86, 88, 92], "9999": 86, "rotat": [86, 88, 94, 97, 98, 101], "turbul": 86, "renorm": 86, "harder": 86, "push": [86, 89, 99, 100, 105], "cart": [87, 99, 100], "mountain": 87, "nois": [87, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104], "regard": 87, "underpow": 87, "effort": 87, "easier": 87, "ones": [87, 93], "57": 88, "coars": 88, "barto": [88, 89, 99, 100, 107, 108], "book": [88, 107], "link": [88, 94, 95, 96, 97, 98, 102, 103], "linearli": [88, 99, 100], "actuat": [88, 89, 97, 98], "swing": [88, 92], "free": [88, 92, 93, 94, 97, 98, 99, 100, 105], "height": [88, 96, 99, 104], "hang": 88, "downward": 88, "seen": [88, 95, 105], "green": 88, "cosin": [88, 99, 102], "theta1": 88, "sine": [88, 99, 102], "theta2": 88, "567": 88, "274": 88, "4\u03c0": 88, "9\u03c0": 88, "rad": [88, 89, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104], "few": 88, "incur": [88, 108], "introduct": [88, 107, 108], "book_or_nip": 88, "neurip": [88, 105], "paper": [88, 99, 105], "nip": [88, 105], "equat": [88, 92], "confirm": 88, "experiment": [88, 105], "radian": [88, 89, 92, 100], "1996": 88, "touretzki": 88, "mozer": 88, "hasselmo": 88, "ed": [88, 110], "vol": 88, "mit": 88, "proceed": 88, "cc": 88, "1995": 88, "8f1d43620bc6bb580df6e80b0dc05c48": 88, "pdf": 88, "anderson": [89, 99, 100], "neuronlik": [89, 99, 100], "adapt": [89, 99, 100, 108], "That": 89, "un": 89, "frictionless": 89, "balanc": [89, 99, 100], "vari": [89, 99, 100, 105], "418": 89, "untermin": 89, "2095": 89, "allot": 89, "475": 89, "05": [89, 94, 95, 101], "07": [90, 91], "sinusoid": [90, 91], "vallei": [90, 91], "strateg": [90, 91], "hill": [90, 91], "andrew": [90, 91], "moor": [90, 91], "phd": [90, 91, 103], "thesi": [90, 91, 103], "1990": [90, 91], "techreport": [90, 91], "moore90efficientmemori": [90, 91], "author": [90, 91], "william": [90, 91], "institut": [90, 91], "univers": [90, 91], "cambridg": [90, 91], "year": [90, 91], "001": [90, 92, 96, 99, 104], "0025": [90, 91], "collis": [90, 91], "inelast": [90, 91], "upon": [90, 91], "quickli": [90, 105], "penalis": [90, 91, 94, 95, 96, 97, 98, 99, 101, 102, 103, 104], "0015": 91, "45": [91, 98, 101], "999": 91, "invert": [92, 93], "swingup": 92, "theori": [92, 99, 105], "diagram": 92, "meter": 92, "theta": 92, "tau": 92, "counter": 92, "clockwis": 92, "theta_dt": 92, "heta": 92, "2736044": 92, "calcul": [92, 93, 94, 97, 98, 99, 101, 102, 109], "simplifi": [92, 105], "math": 92, "half": 93, "cheetah": 93, "standup": 93, "facilit": [93, 105], "develop": 93, "biomechan": 93, "graphic": [93, 105], "anim": 93, "area": 93, "accur": [93, 105], "octob": 93, "2021": [93, 105], "deepmind": [93, 105], "2022": 93, "everyon": 93, "websit": [93, 105], "framework": 93, "mujoco_pi": [93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104], "ten": [93, 107], "iverteddoublependulum": 93, "gaussian": 93, "mjsim": 93, "qpo": 93, "qvel": [93, 97, 98], "indirectli": 93, "xml": [93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104], "tweak": [93, 103], "introduc": [94, 97, 98], "schulman": 94, "moritz": 94, "levin": 94, "jordan": 94, "abbeel": 94, "torso": [94, 95, 96, 97, 98, 104], "eight": 94, "hing": [94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104], "rotor": [94, 95, 96, 97, 98, 103, 104], "front": [94, 95, 103, 105], "hip_1": [94, 97, 98], "front_left_leg": [94, 97, 98], "angle_1": [94, 97, 98], "hip_2": [94, 97, 98], "front_right_leg": [94, 97, 98], "angle_2": 94, "hip_3": 94, "back_leg": 94, "angle_3": 94, "hip_4": 94, "right_back_leg": 94, "angle_4": 94, "deriv": [94, 95, 96, 97, 98, 99, 100, 103, 104], "exclude_current_positions_from_observ": [94, 95, 96, 97, 103, 104], "113": 94, "x_posit": [94, 95, 96, 97, 103, 104], "y_posit": [94, 97, 103], "111": 94, "centr": [94, 97, 98], "ankle_1": 94, "ankle_2": 94, "ankle_3": 94, "ankle_4": 94, "19": [94, 97, 98, 101], "dof": [94, 97, 98], "quaternion": [94, 97, 98], "healthy_reward": [94, 96, 97, 104], "healthi": [94, 96, 97, 104], "forward_reward": [94, 95, 96, 97, 103, 104], "dt": [94, 95, 96, 97, 101, 102, 103, 104], "frametim": [94, 95, 96, 97, 103, 104], "ctrl_cost": [94, 95, 96, 97, 103, 104], "too": [94, 95, 96, 97, 98, 99, 101, 102, 103, 104], "ctrl_cost_weight": [94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104], "ctr_cost_weight": 94, "contact_cost": [94, 97], "contact_cost_weight": [94, 97], "contact_force_rang": 94, "reset_noise_scal": [94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104], "deviat": [94, 95, 99, 103], "intention": [94, 97, 98], "therebi": [94, 97, 98], "said": [94, 96, 97, 104], "unhealthi": [94, 96, 97, 104], "healthy_z_rang": [94, 96, 97, 104], "terminate_when_unhealthi": [94, 96, 97, 104], "xml_file": [94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104], "path": [94, 95, 96, 97, 101, 102, 103, 104], "model": [94, 95, 96, 97, 103, 104, 105], "5e": [94, 96, 97, 104], "perturb": [94, 95, 96, 97, 103, 104], "exclud": [94, 95, 96, 97, 103, 104], "induct": [94, 95, 96, 97, 103, 104], "bia": [94, 95, 96, 97, 103, 104], "induc": [94, 95, 96, 97, 103, 104], "agnost": [94, 95, 96, 97, 98, 103, 104], "bind": [94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104], "camera": [94, 95, 96, 97, 98, 99, 100, 103, 104, 105], "max_time_step": [94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104], "wawrzy\u0144ski": 95, "cat": 95, "paw": 95, "alloc": 95, "backward": 95, "thigh": [95, 96, 97, 98, 104], "shin": [95, 97, 98], "feet": [95, 104], "bthigh": 95, "bshin": 95, "bfoot": 95, "fthigh": 95, "fshin": 95, "ffoot": 95, "tip": [95, 99, 103], "rootz": [95, 96, 104], "slide": [95, 96, 99, 100, 101, 102, 103, 104], "rooti": [95, 96, 104], "rootx": [95, 96, 104], "forward_reward_weight": [95, 96, 97, 103, 104], "half_cheetah": 95, "erez": [96, 97, 98, 104], "tassa": [96, 97, 98, 104], "todorov": [96, 97, 98, 104], "predict": [96, 104], "nonlinear": [96, 104], "compar": [96, 103, 104], "figur": [96, 104], "middl": [96, 104], "thigh_joint": [96, 104], "leg_joint": [96, 104], "foot_joint": [96, 104], "002": [96, 104], "008": [96, 104], "healthy_state_rang": 96, "fallen": 96, "healthy_angle_rang": [96, 104], "376": [97, 98], "synthesi": [97, 98, 105], "onlin": [97, 98, 105], "abdomen": [97, 98], "arm": [97, 98, 101, 102, 105], "elbow": [97, 98, 101], "right_hip_x": [97, 98], "right_thigh": [97, 98], "right_hip_z": [97, 98], "right_hip_i": [97, 98], "right_kne": [97, 98], "left_hip_x": [97, 98], "left_thigh": [97, 98], "left_hip_z": [97, 98], "left_hip_i": [97, 98], "left_kne": [97, 98], "right_shoulder1": [97, 98], "right_shoulder2": [97, 98], "right_elbow": [97, 98], "left_shoulder1": [97, 98], "left_shoulder2": [97, 98], "left_elbow": [97, 98], "378": 97, "root": [97, 98], "lower_waist": [97, 98], "abdomen_z": [97, 98], "abdomen_i": [97, 98], "pelvi": [97, 98], "abdomen_x": [97, 98], "right_upper_arm": [97, 98], "right_lower_arm": [97, 98], "left_upper_arm": [97, 98], "left_lower_arm": [97, 98], "anglular": [97, 98, 100], "29": [97, 98], "aanglular": [97, 98], "33": [97, 98], "34": 97, "35": [97, 98], "37": [97, 98], "39": [97, 98], "41": [97, 98], "43": [97, 98], "velocitti": 97, "addition": [97, 98], "cinert": [97, 98], "inertia": [97, 98], "rigid": [97, 98], "intermedi": [97, 98], "nbodi": [97, 98], "henc": [97, 98, 106], "140": [97, 98], "cvel": [97, 98], "qfrc_actuat": [97, 98], "constraint": [97, 98, 99, 105], "nv": [97, 98], "cfrc_ext": [97, 98], "dim": [97, 98], "003": 97, "015": 97, "nu": [97, 98], "contact_cost_rang": 97, "lai": 98, "state_spac": 98, "uph_cost": 98, "upward": 98, "absolut": [98, 100, 104], "overal": 98, "atom": 98, "though": 98, "inflat": 98, "quad_ctrl_cost": 98, "quad_impact_cost": 98, "000001": 98, "105": 98, "unlik": [98, 99, 100, 101, 102], "beyond": [98, 99, 100, 101, 102, 104], "slider": [99, 100], "unitless": [99, 102], "hinge2": 99, "realist": [99, 105], "accuraci": [99, 105], "analyt": 99, "alive_bonu": 99, "distance_penalti": 99, "velocity_penalti": 99, "005": [99, 101, 102], "y_coordin": 99, "196": 99, "perpendicularli": 99, "cylind": 101, "effector": [101, 102], "fingertip": [101, 102], "shoulder": 101, "forearm": 101, "wrist": 101, "pan": 101, "r_shoulder_pan_joint": 101, "lift": 101, "r_shoulder_lift_joint": 101, "r_upper_arm_roll_joint": 101, "flex": 101, "r_elbow_flex_joint": 101, "r_forearm_roll_joint": 101, "r_wrist_flex_joint": 101, "r_wrist_roll_joint": 101, "analogi": 101, "tips_arm": 101, "obj_slidex": 101, "obj_slidei": 101, "goal_slidex": 101, "goal_slidei": 101, "sphere": 101, "reward_near": 101, "unattach": [101, 102], "reward_control": [101, 102], "euclidean": [101, 102], "perman": 101, "323": 101, "rise": 101, "asset": [101, 102], "gymnasmium": 101, "fixtur": 102, "joint0": 102, "joint1": 102, "target_x": 102, "target_i": 102, "position_fingertip": 102, "position_target": 102, "na": [102, 105], "disk": 102, "radiu": 102, "everyth": 102, "02": 102, "r\u00e9mi": 103, "coulom": 103, "applic": [103, 105], "segment": 103, "articul": [103, 105], "suspend": 103, "subject": [103, 105], "fluid": 103, "viscou": 103, "coeffici": 103, "motor1_rot": 103, "motor2_rot": 103, "\u03b8": 103, "free_body_rot": 103, "slider1": 103, "slider2": 103, "04": 103, "swim": 103, "split": 104, "thigh_left_joint": 104, "leg_left_joint": 104, "foot_left_joint": 104, "ctr_cost": 104, "doom": 105, "focus": 105, "visual": 105, "thousand": 105, "depth": 105, "annot": 105, "label": 105, "2016": 105, "cite": 105, "huge": 105, "3v3": 105, "hundr": 105, "roughli": 105, "tweakabl": 105, "monei": 105, "minecraft": 105, "challeng": 105, "procedur": 105, "generaliz": 105, "skill": 105, "slime": 105, "volleybal": 105, "motiv": 105, "maintain": [105, 111], "premad": 105, "imperfect": 105, "twisti": 105, "puzzl": 105, "weiqi": 105, "famous": 105, "conquer": 105, "alphago": 105, "synthes": 105, "neuro": 105, "architectur": 105, "integr": 105, "twin": 105, "concept": 105, "seamless": 105, "hardwar": 105, "world": [105, 110], "firmwar": 105, "neuroflight": 105, "extens": 105, "ro": 105, "thrust": 105, "ascend": 105, "shall": 105, "altitud": 105, "aerodynam": 105, "drag": 105, "light": 105, "poli": 105, "pinocchio": 105, "meshcat": 105, "web": 105, "minimalist": 105, "interior": 105, "room": 105, "hallwai": 105, "offic": 105, "home": 105, "dmlab": 105, "bitcraz": 105, "crazyfli": 105, "nanoquadrotor": 105, "mar": 105, "endeavor": 105, "gap": 105, "methodologi": 105, "coverag": 105, "commerci": 105, "mac": 105, "linux": 105, "laboratori": 105, "internet": 105, "ego": 105, "cloud": 105, "semant": 105, "project": 105, "cours": 105, "wide": 105, "account": 105, "yield": 105, "voltag": 105, "duti": 105, "cycl": 105, "emphasi": 105, "percept": 105, "social": 105, "driver": 105, "uncertain": 105, "propos": 105, "merg": 105, "intersect": 105, "roundabout": 105, "longitudin": 105, "comprehens": 105, "conduct": 105, "akin": 105, "anomali": 105, "inject": 105, "studi": 105, "robust": 105, "brax": 105, "compil": 105, "llvm": 105, "phase": 105, "gcc": 105, "cuda": 105, "hyperparamet": 105, "cheap": 105, "surrog": 105, "evolutionari": 105, "obsolet": 105, "windygrid": 105, "bandit": 105, "server": 105, "advertis": 105, "greedi": 105, "ucb1": 105, "trade": 105, "great": 105, "focu": 105, "simplic": 105, "autom": 105, "deduct": 105, "verif": 105, "minatar": 105, "metatrad": 105, "unus": 105, "techniqu": 105, "hard": 105, "strive": 105, "novel": 105, "transport": 105, "warehous": 105, "storag": 105, "overfit": 105, "mathemat": 105, "dataset": 105, "arxiv": 105, "2107": 105, "07373": 105, "baselin": 105, "expos": 105, "blockqnn": 105, "wise": 105, "nsc": 105, "cifar": 105, "meta": 105, "tag": 105, "answer": 105, "classif": 105, "omg": 105, "toolbox": 105, "electron": 105, "musculoskelet": 105, "opensim": 105, "physiolog": 105, "competit": 105, "2017": 105, "foss": 105, "interoper": 105, "quantum": 105, "circuit": 105, "wire": 105, "qubit": 105, "googl": 105, "quantumai": 105, "cirq": 105, "quadrotor": 105, "casadi": 105, "priori": 105, "taobao": 105, "largest": 105, "commerc": 105, "morl": 105, "equiti": 105, "market": 105, "acm": 105, "icaif21": 105, "public": 105, "financi": 105, "daili": 105, "investor": 105, "respons": 105, "theorem": 105, "prover": 105, "vampir": 105, "theoret": 105, "workshop": 105, "f1tenth": 105, "unoffici": 105, "baselines3": 105, "trackmania": 105, "2020": 105, "latent": 105, "imagin": 105, "miniatur": 105, "racecar": 105, "portabl": 105, "evolut": 105, "torc": 105, "wireless": 105, "elastica": 105, "assembli": 105, "slender": 105, "cosserat": 105, "rod": 105, "supertuxkart": 105, "accompani": 105, "ostrich": 105, "bio": 105, "mechan": 105, "locomot": 105, "soft": 105, "snake": 105, "propuls": 105, "music": 105, "dual": 105, "dexter": 105, "hand": 105, "isaac": 105, "omnivers": 105, "rust": 105, "jax": 105, "frozen": 106, "lake": 106, "suitabl": 106, "card": 107, "dealer": 107, "jack": 107, "queen": 107, "king": 107, "ac": 107, "usabl": 107, "deck": 107, "decid": [107, 109], "bust": 107, "reveal": 107, "facedown": 107, "goe": 107, "outcom": 107, "incompleteidea": 107, "2nd": 107, "html": 107, "sab": 107, "48": 108, "106": 108, "With": 108, "inspir": 108, "dennybritz": 108, "blob": 108, "cliff_walk": 108, "board": 108, "4x12": 108, "3x12": 108, "fact": 108, "slipperi": 109, "dir": 109, "current_row": 109, "nrow": 109, "current_col": 109, "col": 109, "4x4": 109, "desc": 109, "map_nam": 109, "sfff": 109, "fhfh": 109, "fffh": 109, "hffg": 109, "generate_random_map": 109, "toy_text": 109, "frozen_lak": 109, "preload": 109, "8x8": 109, "sfffffff": 109, "ffffffff": 109, "fffhffff": 109, "fffffhff": 109, "fhhfffhf": 109, "fhffhfhf": 109, "fffhfffg": 109, "perpendicular": 109, "bug": [109, 110], "maxq": 110, "decomposit": 110, "tom": 110, "dietterich": 110, "reen": 110, "ellow": 110, "lue": 110, "passeng": 110, "south": 110, "north": 110, "east": 110, "west": 110, "pickup": 110, "404": 110, "reachabl": 110, "taxi_row": 110, "taxi_col": 110, "passenger_loc": 110, "decod": 110, "action_mask": 110, "Or": 110, "q_valu": 110, "illeg": 110, "cleaner": 110, "disallow": 110, "loc": 110, "passidx": 110, "capabl": 111}, "objects": {"Space": [[4, 0, 1, "", "dtype"]], "": [[10, 1, 1, "", "action_space"], [10, 1, 1, "", "observation_space"], [10, 1, 1, "", "single_action_space"], [10, 1, 1, "", "single_observation_space"]], "gymnasium": [[12, 2, 1, "", "ActionWrapper"], [2, 2, 1, "", "Env"], [14, 2, 1, "", "ObservationWrapper"], [15, 2, 1, "", "RewardWrapper"], [11, 2, 1, "", "Wrapper"], [3, 3, 1, "", "make"], [3, 3, 1, "", "register"], [3, 3, 1, "", "spec"]], "gymnasium.ActionWrapper.ActionWrapper": [[12, 3, 1, "", "action"]], "gymnasium.Env": [[2, 1, 1, "", "action_space"], [2, 3, 1, "", "close"], [2, 1, 1, "", "metadata"], [2, 0, 1, "", "np_random"], [2, 1, 1, "", "observation_space"], [2, 3, 1, "", "render"], [2, 1, 1, "", "render_mode"], [2, 3, 1, "", "reset"], [2, 1, 1, "", "reward_range"], [2, 1, 1, "", "spec"], [2, 3, 1, "", "step"], [2, 0, 1, "", "unwrapped"]], "gymnasium.ObservationWrapper": [[14, 3, 1, "", "observation"]], "gymnasium.RewardWrapper.RewardWrapper": [[15, 3, 1, "", "reward"]], "gymnasium.Wrapper": [[11, 0, 1, "", "action_space"], [11, 3, 1, "", "close"], [11, 0, 1, "", "metadata"], [11, 0, 1, "", "np_random"], [11, 0, 1, "", "observation_space"], [11, 3, 1, "", "reset"], [11, 0, 1, "", "reward_range"], [11, 0, 1, "", "spec"], [11, 3, 1, "", "step"], [11, 0, 1, "", "unwrapped"]], "gymnasium.spaces": [[6, 2, 1, "", "Box"], [5, 2, 1, "", "Dict"], [6, 2, 1, "", "Discrete"], [5, 2, 1, "", "Graph"], [6, 2, 1, "", "MultiBinary"], [6, 2, 1, "", "MultiDiscrete"], [5, 2, 1, "", "Sequence"], [4, 2, 1, "", "Space"], [6, 2, 1, "", "Text"], [5, 2, 1, "", "Tuple"]], "gymnasium.spaces.Box": [[6, 4, 1, "", "is_bounded"], [6, 4, 1, "", "sample"], [6, 4, 1, "", "seed"]], "gymnasium.spaces.Dict": [[5, 4, 1, "", "sample"], [5, 4, 1, "", "seed"]], "gymnasium.spaces.Discrete": [[6, 4, 1, "", "sample"], [6, 4, 1, "", "seed"]], "gymnasium.spaces.Graph": [[5, 4, 1, "", "sample"], [5, 4, 1, "", "seed"]], "gymnasium.spaces.MultiBinary": [[6, 4, 1, "", "sample"], [6, 4, 1, "", "seed"]], "gymnasium.spaces.MultiDiscrete": [[6, 4, 1, "", "sample"], [6, 4, 1, "", "seed"]], "gymnasium.spaces.Sequence": [[5, 4, 1, "", "sample"], [5, 4, 1, "", "seed"]], "gymnasium.spaces.Text": [[6, 4, 1, "", "sample"], [6, 4, 1, "", "seed"]], "gymnasium.spaces.Tuple": [[5, 4, 1, "", "sample"], [5, 4, 1, "", "seed"]], "gymnasium.spaces.space.Space": [[4, 3, 1, "", "contains"], [4, 3, 1, "", "from_jsonable"], [4, 3, 1, "", "sample"], [4, 3, 1, "", "seed"], [4, 0, 1, "", "shape"], [4, 3, 1, "", "to_jsonable"]], "gymnasium.spaces.utils": [[7, 3, 1, "", "flatdim"], [7, 3, 1, "", "flatten"], [7, 3, 1, "", "flatten_space"], [7, 3, 1, "", "unflatten"]], "gymnasium.utils.env_checker": [[9, 3, 1, "", "check_env"]], "gymnasium.utils.play": [[9, 2, 1, "", "PlayPlot"], [9, 2, 1, "", "PlayableGame"], [9, 3, 1, "", "play"]], "gymnasium.utils.play.PlayPlot": [[9, 4, 1, "", "callback"]], "gymnasium.utils.play.PlayableGame": [[9, 4, 1, "", "process_event"]], "gymnasium.utils.save_video": [[9, 3, 1, "", "capped_cubic_video_schedule"], [9, 3, 1, "", "save_video"]], "gymnasium.utils.seeding": [[9, 3, 1, "", "np_random"]], "gymnasium.utils.step_api_compatibility": [[9, 3, 1, "", "convert_to_done_step_api"], [9, 3, 1, "", "convert_to_terminated_truncated_step_api"], [9, 3, 1, "", "step_api_compatibility"]], "gymnasium.vector": [[10, 2, 1, "", "AsyncVectorEnv"], [10, 2, 1, "", "SyncVectorEnv"], [10, 2, 1, "", "VectorEnv"], [10, 3, 1, "", "make"]], "gymnasium.vector.VectorEnv": [[10, 4, 1, "", "close"], [10, 4, 1, "", "reset"], [10, 4, 1, "", "step"]], "gymnasium.vector.utils": [[8, 3, 1, "", "batch_space"], [8, 3, 1, "", "concatenate"], [8, 3, 1, "", "create_empty_array"], [8, 3, 1, "", "create_shared_memory"], [8, 3, 1, "", "iterate"], [8, 3, 1, "", "read_from_shared_memory"], [8, 3, 1, "", "write_to_shared_memory"]], "gymnasium.wrappers": [[13, 2, 1, "", "AtariPreprocessing"], [13, 2, 1, "", "AutoResetWrapper"], [12, 2, 1, "", "ClipAction"], [13, 2, 1, "", "EnvCompatibility"], [14, 2, 1, "", "FilterObservation"], [14, 2, 1, "", "FlattenObservation"], [14, 2, 1, "", "FrameStack"], [14, 2, 1, "", "GrayScaleObservation"], [13, 2, 1, "", "HumanRendering"], [14, 2, 1, "", "NormalizeObservation"], [15, 2, 1, "", "NormalizeReward"], [13, 2, 1, "", "OrderEnforcing"], [13, 2, 1, "", "PassiveEnvChecker"], [14, 2, 1, "", "PixelObservationWrapper"], [13, 2, 1, "", "RecordEpisodeStatistics"], [13, 2, 1, "", "RecordVideo"], [13, 2, 1, "", "RenderCollection"], [12, 2, 1, "", "RescaleAction"], [14, 2, 1, "", "ResizeObservation"], [13, 2, 1, "", "StepAPICompatibility"], [14, 2, 1, "", "TimeAwareObservation"], [13, 2, 1, "", "TimeLimit"], [14, 2, 1, "", "TransformObservation"], [15, 2, 1, "", "TransformReward"], [13, 2, 1, "", "VectorListInfo"]]}, "objtypes": {"0": "py:property", "1": "py:attribute", "2": "py:class", "3": "py:function", "4": "py:method"}, "objnames": {"0": ["py", "property", "Python property"], "1": ["py", "attribute", "Python attribute"], "2": ["py", "class", "Python class"], "3": ["py", "function", "Python function"], "4": ["py", "method", "Python method"]}, "titleterms": {"404": 0, "page": [0, 1], "Not": 0, "found": 0, "The": [0, 105], "request": 0, "could": 0, "gymnasium": [1, 2, 10, 11, 17, 111], "doc": 1, "instruct": 1, "modifi": 1, "environ": [1, 2, 3, 9, 10, 13, 16, 17, 19, 105, 111], "edit": 1, "an": [1, 16], "ad": 1, "new": [1, 9], "atari": [1, 13, 20, 39], "env": [1, 2, 10, 16, 17, 105], "non": 1, "other": [1, 105], "step": [1, 9, 16, 17], "build": 1, "document": 1, "method": [2, 4, 10, 11], "attribut": [2, 4, 10, 11], "addit": 2, "implement": [2, 11], "registri": 3, "make": [3, 10, 17], "regist": [3, 17], "all": 3, "spec": 3, "space": [4, 5, 6, 7, 8, 16, 19, 20, 46, 47, 48, 49, 50, 84, 85, 86, 88, 89, 90, 91, 92, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 107, 109], "fundament": [4, 6], "composit": [4, 5], "util": [4, 7, 8, 9], "vector": [4, 8, 10, 13, 19], "dict": 5, "tupl": 5, "sequenc": 5, "graph": 5, "box": [6, 34], "discret": 6, "multibinari": 6, "multidiscret": 6, "text": [6, 106], "share": [8, 19], "memori": [8, 19], "visual": 9, "save": 9, "render": [9, 13, 17], "video": [9, 13, 80, 105], "old": 9, "api": [9, 16, 111], "compat": [9, 13, 16], "seed": 9, "check": [9, 16], "vectorenv": 10, "async": 10, "sync": 10, "wrapper": [11, 12, 13, 14, 15, 16, 17], "custom": [11, 17, 19], "action": [12, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 84, 85, 86, 88, 89, 90, 91, 92, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 107, 108, 109, 110], "clip": 12, "rescal": 12, "misc": 13, "preprocess": 13, "autoreset": 13, "passiv": 13, "checker": 13, "human": 13, "order": 13, "enforc": 13, "record": 13, "episod": [13, 84, 85, 86, 88, 89, 90, 91, 92, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104], "statist": 13, "collect": [13, 111], "time": [13, 14, 18], "limit": [13, 18], "list": [13, 39], "info": [13, 110], "observ": [14, 17, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 84, 85, 86, 88, 89, 90, 91, 92, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 107, 108, 109, 110], "transform": [14, 15], "filter": 14, "flatten": 14, "framestack": 14, "grai": 14, "scale": 14, "normal": [14, 15], "pixel": 14, "resiz": 14, "awar": 14, "reward": [15, 20, 23, 24, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 84, 85, 86, 88, 89, 90, 91, 92, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 107, 108, 109, 110], "basic": 16, "usag": [16, 19], "initi": [16, 17], "interact": 16, "chang": 16, "backward": 16, "conform": 16, "plai": 16, "within": 16, "your": [17, 19], "own": 17, "subclass": 17, "declar": 17, "construct": 17, "from": 17, "state": [17, 84, 85, 86, 88, 89, 90, 91, 92, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104], "reset": [17, 85], "close": 17, "creat": [17, 19], "packag": 17, "instanc": 17, "us": 17, "handl": [18, 19], "termin": [18, 84, 85, 86], "truncat": [18, 92], "import": 18, "learn": [18, 105, 111], "code": 18, "solut": 18, "work": 19, "intermedi": 19, "except": 19, "advanc": 19, "autorom": 20, "instal": 20, "rom": 20, "stochast": 20, "common": 20, "argument": [20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 84, 85, 86, 88, 89, 90, 91, 92, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 107, 108, 109, 110], "version": [20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 84, 85, 86, 88, 90, 91, 92, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 107, 108, 109, 110], "histori": [20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 84, 85, 86, 88, 90, 91, 92, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 107, 108, 109, 110], "name": [20, 60], "scheme": 20, "flavor": 20, "refer": [20, 85, 88, 111], "adventur": 21, "descript": [21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 84, 85, 86, 88, 89, 90, 91, 92, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 107, 108, 110], "air": 22, "raid": 22, "alien": 23, "amidar": 24, "assault": 25, "asterix": 26, "asteroid": 27, "atlanti": 28, "bank": 29, "heist": 29, "battl": 30, "zone": 30, "beam": 31, "rider": 31, "berzerk": 32, "bowl": 33, "breakout": 35, "carniv": 36, "centiped": 37, "chopper": 38, "command": 38, "complet": 39, "crazi": 40, "climber": 40, "defend": 41, "demon": 42, "attack": 42, "doubl": [43, 99], "dunk": 43, "elev": 44, "enduro": 45, "fishingderbi": 46, "freewai": 47, "frostbit": 48, "gopher": 49, "gravitar": 50, "hero": 51, "icehockei": 52, "jamesbond": 53, "journeyescap": 54, "kangaroo": 55, "krull": 56, "kung": 57, "fu": 57, "master": 57, "montezuma": 58, "reveng": 58, "m": 59, "pacman": 59, "thi": 60, "game": [60, 105], "phoenix": 61, "pitfal": 62, "pong": 63, "pooyan": 64, "privateey": 65, "qbert": 66, "riverraid": 67, "road": 68, "runner": 68, "robot": [69, 105], "tank": 69, "seaquest": 70, "ski": 71, "solari": 72, "spaceinvad": 73, "stargunn": 74, "tenni": 75, "timepilot": 76, "tutankham": 77, "up": 78, "n": 78, "down": 78, "ventur": 79, "pinbal": 80, "wizard": 81, "wor": 81, "zaxxon": 82, "box2d": 83, "biped": 84, "walker": 84, "start": [84, 85, 86, 88, 89, 90, 91, 92, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104], "credit": [84, 85, 86], "car": [85, 90, 91], "race": [85, 105], "lunar": 86, "lander": 86, "classic": [87, 105], "control": [87, 105], "acrobot": 88, "end": [88, 89, 90, 91, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104], "cart": 89, "pole": 89, "mountain": [90, 91], "transit": [90, 91], "dynam": [90, 91], "continu": 91, "pendulum": [92, 99, 100], "mujoco": 93, "ant": 94, "half": 95, "cheetah": 95, "hopper": 96, "humanoid": [97, 98], "standup": 98, "invert": [99, 100], "pusher": 101, "reacher": 102, "swimmer": 103, "note": 103, "walker2d": 104, "third": 105, "parti": 105, "vizdoom": 105, "flappi": 105, "bird": 105, "gym": 105, "A": 105, "openai": 105, "derk": 105, "gpu": 105, "acceler": 105, "moba": 105, "minerl": 105, "procgen": 105, "slimevolleygym": 105, "simpl": 105, "singl": 105, "multi": 105, "agent": 105, "reinforc": [105, 111], "stabl": 105, "retro": 105, "uniti": 105, "ml": 105, "board": 105, "card": 105, "etc": 105, "abalon": 105, "two": 105, "player": 105, "abstract": 105, "strategi": 105, "spoof": 105, "xiangqi": 105, "chines": 105, "chess": 105, "rubikscubegym": 105, "gymgo": 105, "gymfc": 105, "flight": 105, "tune": 105, "train": 105, "framework": 105, "gazebo": 105, "goddard": 105, "": 105, "rocket": 105, "problem": 105, "jimini": 105, "miniworld": 105, "pybullet": 105, "drone": 105, "marsexplor": 105, "panda": 105, "robo": 105, "offworld": 105, "autonom": 105, "drive": 105, "traffic": 105, "carla": 105, "duckietown": 105, "electr": 105, "motor": 105, "highwai": 105, "longicontrol": 105, "sumo": 105, "rl": 105, "commonroad": 105, "pettingzoo": 105, "anomalous_rl_env": 105, "carl": 105, "compilergym": 105, "dacbench": 105, "gridworld": 105, "adserv": 105, "algorithm": 105, "anytrad": 105, "autokei": 105, "ccc": 105, "cellular": 105, "automata": 105, "inventori": 105, "maze": 105, "mtsim": 105, "legaci": 105, "toytext": 105, "riverswim": 105, "recsi": 105, "sokoban": 105, "math": 105, "prog": 105, "synth": 105, "nasgym": 105, "nlpgym": 105, "toolkit": 105, "develop": 105, "solv": 105, "nlp": 105, "task": 105, "obstacl": 105, "tower": 105, "openmodelica": 105, "microgrid": 105, "osim": 105, "pge": 105, "parallel": 105, "engin": 105, "qasgym": 105, "safe": 105, "virtualtaobao": 105, "mo": 105, "abid": 105, "satur": 105, "shinrl": 105, "go": 105, "explor": 105, "tmrl": 105, "racing_dream": 105, "racecar_gym": 105, "evogym": 105, "design": 105, "tool": 105, "l2r": 105, "gym_torc": 105, "mobil": 105, "softrobot": 105, "pyelastica": 105, "tuxkart": 105, "ai": 105, "ostrichrl": 105, "quadrup": 105, "pogo": 105, "stick": 105, "jump": 105, "igibson": 105, "snakerl": 105, "starship": 105, "land": 105, "raveforc": 105, "line": 105, "follow": 105, "dexteroushand": 105, "omniisaacgymenv": 105, "border": 105, "spacerobotenv": 105, "gymnax": 105, "toi": 106, "blackjack": 107, "cliff": 108, "walk": 108, "frozen": 109, "lake": 109, "taxi": 110, "i": 111, "standard": 111, "divers": 111}, "envversion": {"sphinx.domains.c": 2, "sphinx.domains.changeset": 1, "sphinx.domains.citation": 1, "sphinx.domains.cpp": 8, "sphinx.domains.index": 1, "sphinx.domains.javascript": 2, "sphinx.domains.math": 2, "sphinx.domains.python": 3, "sphinx.domains.rst": 2, "sphinx.domains.std": 2, "sphinx": 57}, "alltitles": {"404 - Page Not Found": [[0, "page-not-found"]], "The requested page could not be found.": [[0, "the-requested-page-could-not-be-found"]], "Gymnasium-docs": [[1, "gymnasium-docs"]], "Instructions for modifying environment pages": [[1, "instructions-for-modifying-environment-pages"]], "Editing an environment page": [[1, "editing-an-environment-page"]], "Adding a new environment": [[1, "adding-a-new-environment"]], "Atari env": [[1, "atari-env"]], "Non-Atari env": [[1, "non-atari-env"]], "Other steps": [[1, "other-steps"]], "Build the Documentation": [[1, "build-the-documentation"]], "Env": [[2, "env"]], "gymnasium.Env": [[2, "gymnasium-env"]], "Methods": [[2, "methods"], [4, "methods"], [10, "methods"], [11, "methods"]], "Attributes": [[2, "attributes"], [4, "attributes"], [10, "attributes"], [11, "attributes"]], "Additional Methods": [[2, "additional-methods"]], "Implementing environments": [[2, "implementing-environments"]], "Registry": [[3, "registry"]], "Make": [[3, "make"]], "Register": [[3, "register"]], "All registered environments": [[3, "all-registered-environments"]], "Spec": [[3, "spec"]], "Spaces": [[4, "spaces"], [16, "spaces"]], "Fundamental Spaces": [[4, "fundamental-spaces"], [6, "fundamental-spaces"]], "Composite Spaces": [[4, "composite-spaces"], [5, "composite-spaces"]], "Utils": [[4, "utils"], [9, "utils"]], "Vector Utils": [[4, "vector-utils"]], "Dict": [[5, "dict"]], "Tuple": [[5, "tuple"]], "Sequence": [[5, "sequence"]], "Graph": [[5, "graph"]], "Box": [[6, "box"]], "Discrete": [[6, "discrete"]], "MultiBinary": [[6, "multibinary"]], "MultiDiscrete": [[6, "multidiscrete"]], "Text": [[6, "text"]], "Spaces Utils": [[7, "spaces-utils"]], "Spaces Vector Utils": [[8, "spaces-vector-utils"]], "Shared Memory Utils": [[8, "shared-memory-utils"]], "Visualization": [[9, "visualization"]], "Save Rendering Videos": [[9, "save-rendering-videos"]], "Old to New Step API Compatibility": [[9, "old-to-new-step-api-compatibility"]], "Seeding": [[9, "seeding"]], "Environment Checking": [[9, "environment-checking"]], "Vector": [[10, "vector"]], "Gymnasium.vector.VectorEnv": [[10, "gymnasium-vector-vectorenv"]], "Making Vector Environments": [[10, "making-vector-environments"]], "Async Vector Env": [[10, "async-vector-env"]], "Sync Vector Env": [[10, "sync-vector-env"]], "Wrappers": [[11, "wrappers"], [16, "wrappers"]], "gymnasium.Wrapper": [[11, "gymnasium-wrapper"]], "Gymnasium Wrappers": [[11, "gymnasium-wrappers"]], "Implementing a custom wrapper": [[11, "implementing-a-custom-wrapper"]], "Action Wrappers": [[12, "action-wrappers"]], "Action Wrapper": [[12, "action-wrapper"]], "Clip Action": [[12, "clip-action"]], "Rescale Action": [[12, "rescale-action"]], "Misc Wrappers": [[13, "misc-wrappers"]], "Atari Preprocessing": [[13, "atari-preprocessing"]], "Autoreset": [[13, "autoreset"]], "Compatibility": [[13, "compatibility"]], "Passive Environment Checker": [[13, "passive-environment-checker"]], "Human Rendering": [[13, "human-rendering"]], "Order Enforcing": [[13, "order-enforcing"]], "Record Episode Statistics": [[13, "record-episode-statistics"]], "Record Video": [[13, "record-video"]], "Render Collection": [[13, "render-collection"]], "Time Limit": [[13, "time-limit"]], "Vector List Info": [[13, "vector-list-info"]], "Observation Wrappers": [[14, "observation-wrappers"]], "Observation Wrapper": [[14, "observation-wrapper"]], "Transform Observation": [[14, "transform-observation"]], "Filter Observation": [[14, "filter-observation"]], "Flatten Observation": [[14, "flatten-observation"]], "Framestack Observations": [[14, "framestack-observations"]], "Gray Scale Observation": [[14, "gray-scale-observation"]], "Normalize Observation": [[14, "normalize-observation"]], "Pixel Observation Wrapper": [[14, "pixel-observation-wrapper"]], "Resize Observation": [[14, "resize-observation"]], "Time Aware Observation": [[14, "time-aware-observation"]], "Reward Wrappers": [[15, "reward-wrappers"]], "Reward Wrapper": [[15, "reward-wrapper"]], "Transform Reward": [[15, "transform-reward"]], "Normalize Reward": [[15, "normalize-reward"]], "Basic Usage": [[16, "basic-usage"]], "Initializing Environments": [[16, "initializing-environments"]], "Interacting with the Environment": [[16, "interacting-with-the-environment"]], "Change in env.step API": [[16, "change-in-env-step-api"]], "Backward compatibility": [[16, "backward-compatibility"]], "Checking API-Conformity": [[16, "checking-api-conformity"]], "Playing within an environment": [[16, "playing-within-an-environment"]], "Make your own custom environment": [[17, "make-your-own-custom-environment"]], "Subclassing gymnasium.Env": [[17, "subclassing-gymnasium-env"]], "Declaration and Initialization": [[17, "declaration-and-initialization"]], "Constructing Observations From Environment States": [[17, "constructing-observations-from-environment-states"]], "Reset": [[17, "reset"]], "Step": [[17, "step"]], "Rendering": [[17, "rendering"]], "Close": [[17, "close"]], "Registering Envs": [[17, "registering-envs"]], "Creating a Package": [[17, "creating-a-package"]], "Creating Environment Instances": [[17, "creating-environment-instances"]], "Using Wrappers": [[17, "using-wrappers"]], "Handling Time Limits": [[18, "handling-time-limits"]], "Termination": [[18, "termination"]], "Truncation": [[18, "truncation"]], "Importance in learning code": [[18, "importance-in-learning-code"]], "Solution": [[18, "solution"]], "Vectorizing your environments": [[19, "vectorizing-your-environments"]], "Vectorized Environments": [[19, "vectorized-environments"]], "Creating a vectorized environment": [[19, "creating-a-vectorized-environment"]], "Working with vectorized environments": [[19, "working-with-vectorized-environments"]], "Observation & Action spaces": [[19, "observation-action-spaces"]], "Intermediate Usage": [[19, "intermediate-usage"]], "Shared memory": [[19, "shared-memory"]], "Exception handling": [[19, "exception-handling"]], "Advanced Usage": [[19, "advanced-usage"]], "Custom spaces": [[19, "custom-spaces"]], "Atari": [[20, "atari"]], "AutoROM (installing the ROMs)": [[20, "autorom-installing-the-roms"]], "Action Space": [[20, "action-space"], [46, "action-space"], [47, "action-space"], [48, "action-space"], [49, "action-space"], [50, "action-space"], [84, "action-space"], [85, "action-space"], [86, "action-space"], [88, "action-space"], [89, "action-space"], [90, "action-space"], [91, "action-space"], [92, "action-space"], [94, "action-space"], [95, "action-space"], [96, "action-space"], [97, "action-space"], [98, "action-space"], [99, "action-space"], [100, "action-space"], [101, "action-space"], [102, "action-space"], [103, "action-space"], [104, "action-space"], [107, "action-space"], [109, "action-space"]], "Observation Space": [[20, "observation-space"], [84, "observation-space"], [85, "observation-space"], [86, "observation-space"], [88, "observation-space"], [89, "observation-space"], [90, "observation-space"], [91, "observation-space"], [92, "observation-space"], [94, "observation-space"], [95, "observation-space"], [96, "observation-space"], [97, "observation-space"], [98, "observation-space"], [99, "observation-space"], [100, "observation-space"], [101, "observation-space"], [102, "observation-space"], [103, "observation-space"], [104, "observation-space"], [107, "observation-space"], [109, "observation-space"]], "Rewards": [[20, "rewards"], [23, "rewards"], [24, "rewards"], [26, "rewards"], [27, "rewards"], [28, "rewards"], [29, "rewards"], [30, "rewards"], [31, "rewards"], [32, "rewards"], [33, "rewards"], [34, "rewards"], [35, "rewards"], [36, "rewards"], [37, "rewards"], [38, "rewards"], [40, "rewards"], [41, "rewards"], [42, "rewards"], [43, "rewards"], [44, "rewards"], [45, "rewards"], [46, "rewards"], [47, "rewards"], [48, "rewards"], [49, "rewards"], [50, "rewards"], [51, "rewards"], [52, "rewards"], [53, "rewards"], [54, "rewards"], [55, "rewards"], [56, "rewards"], [62, "rewards"], [63, "rewards"], [64, "rewards"], [65, "rewards"], [66, "rewards"], [67, "rewards"], [68, "rewards"], [69, "rewards"], [70, "rewards"], [71, "rewards"], [72, "rewards"], [73, "rewards"], [74, "rewards"], [75, "rewards"], [76, "rewards"], [84, "rewards"], [85, "rewards"], [86, "rewards"], [88, "rewards"], [89, "rewards"], [92, "rewards"], [94, "rewards"], [95, "rewards"], [96, "rewards"], [97, "rewards"], [98, "rewards"], [99, "rewards"], [100, "rewards"], [101, "rewards"], [102, "rewards"], [103, "rewards"], [104, "rewards"], [107, "rewards"], [109, "rewards"], [110, "rewards"]], "Stochasticity": [[20, "stochasticity"]], "Common Arguments": [[20, "common-arguments"]], "Version History and Naming Schemes": [[20, "version-history-and-naming-schemes"]], "Flavors": [[20, "flavors"]], "References": [[20, "references"], [85, "references"], [88, "references"]], "Adventure": [[21, "adventure"]], "Description": [[21, "description"], [22, "description"], [23, "description"], [24, "description"], [25, "description"], [26, "description"], [27, "description"], [28, "description"], [29, "description"], [30, "description"], [31, "description"], [32, "description"], [33, "description"], [34, "description"], [35, "description"], [36, "description"], [37, "description"], [38, "description"], [40, "description"], [41, "description"], [42, "description"], [43, "description"], [44, "description"], [45, "description"], [46, "description"], [47, "description"], [48, "description"], [49, "description"], [50, "description"], [51, "description"], [52, "description"], [53, "description"], [54, "description"], [55, "description"], [56, "description"], [57, "description"], [58, "description"], [59, "description"], [60, "description"], [61, "description"], [62, "description"], [63, "description"], [64, "description"], [65, "description"], [66, "description"], [67, "description"], [68, "description"], [69, "description"], [70, "description"], [71, "description"], [72, "description"], [73, "description"], [74, "description"], [75, "description"], [76, "description"], [77, "description"], [78, "description"], [79, "description"], [80, "description"], [81, "description"], [82, "description"], [84, "description"], [85, "description"], [86, "description"], [88, "description"], [89, "description"], [90, "description"], [91, "description"], [92, "description"], [94, "description"], [95, "description"], [96, "description"], [97, "description"], [98, "description"], [99, "description"], [100, "description"], [101, "description"], [102, "description"], [103, "description"], [104, "description"], [107, "description"], [108, "description"], [110, "description"]], "Actions": [[21, "actions"], [22, "actions"], [23, "actions"], [24, "actions"], [25, "actions"], [26, "actions"], [27, "actions"], [28, "actions"], [29, "actions"], [30, "actions"], [31, "actions"], [32, "actions"], [33, "actions"], [34, "actions"], [35, "actions"], [36, "actions"], [37, "actions"], [38, "actions"], [40, "actions"], [41, "actions"], [42, "actions"], [43, "actions"], [44, "actions"], [45, "actions"], [51, "actions"], [52, "actions"], [53, "actions"], [54, "actions"], [55, "actions"], [56, "actions"], [57, "actions"], [58, "actions"], [59, "actions"], [60, "actions"], [61, "actions"], [62, "actions"], [63, "actions"], [64, "actions"], [65, "actions"], [66, "actions"], [67, "actions"], [68, "actions"], [69, "actions"], [70, "actions"], [71, "actions"], [72, "actions"], [73, "actions"], [74, "actions"], [75, "actions"], [76, "actions"], [77, "actions"], [78, "actions"], [79, "actions"], [80, "actions"], [81, "actions"], [82, "actions"], [108, "actions"], [110, "actions"]], "Observations": [[21, "observations"], [22, "observations"], [23, "observations"], [24, "observations"], [25, "observations"], [26, "observations"], [27, "observations"], [28, "observations"], [29, "observations"], [30, "observations"], [31, "observations"], [32, "observations"], [33, "observations"], [34, "observations"], [35, "observations"], [36, "observations"], [37, "observations"], [38, "observations"], [40, "observations"], [41, "observations"], [42, "observations"], [43, "observations"], [44, "observations"], [45, "observations"], [46, "observations"], [47, "observations"], [48, "observations"], [49, "observations"], [50, "observations"], [51, "observations"], [52, "observations"], [53, "observations"], [54, "observations"], [55, "observations"], [56, "observations"], [57, "observations"], [58, "observations"], [59, "observations"], [60, "observations"], [61, "observations"], [62, "observations"], [63, "observations"], [64, "observations"], [65, "observations"], [66, "observations"], [67, "observations"], [68, "observations"], [69, "observations"], [70, "observations"], [71, "observations"], [72, "observations"], [73, "observations"], [74, "observations"], [75, "observations"], [76, "observations"], [77, "observations"], [78, "observations"], [79, "observations"], [80, "observations"], [81, "observations"], [82, "observations"], [108, "observations"], [110, "observations"]], "Arguments": [[21, "arguments"], [22, "arguments"], [23, "arguments"], [24, "arguments"], [25, "arguments"], [26, "arguments"], [27, "arguments"], [28, "arguments"], [29, "arguments"], [30, "arguments"], [31, "arguments"], [32, "arguments"], [33, "arguments"], [34, "arguments"], [35, "arguments"], [36, "arguments"], [37, "arguments"], [38, "arguments"], [40, "arguments"], [41, "arguments"], [42, "arguments"], [43, "arguments"], [44, "arguments"], [45, "arguments"], [46, "arguments"], [47, "arguments"], [48, "arguments"], [49, "arguments"], [50, "arguments"], [51, "arguments"], [52, "arguments"], [53, "arguments"], [54, "arguments"], [55, "arguments"], [56, "arguments"], [57, "arguments"], [58, "arguments"], [59, "arguments"], [60, "arguments"], [61, "arguments"], [62, "arguments"], [63, "arguments"], [64, "arguments"], [65, "arguments"], [66, "arguments"], [67, "arguments"], [68, "arguments"], [69, "arguments"], [70, "arguments"], [71, "arguments"], [72, "arguments"], [73, "arguments"], [74, "arguments"], [75, "arguments"], [76, "arguments"], [77, "arguments"], [78, "arguments"], [79, "arguments"], [80, "arguments"], [81, "arguments"], [82, "arguments"], [84, "arguments"], [85, "arguments"], [86, "arguments"], [88, "arguments"], [89, "arguments"], [90, "arguments"], [91, "arguments"], [92, "arguments"], [94, "arguments"], [95, "arguments"], [96, "arguments"], [97, "arguments"], [98, "arguments"], [99, "arguments"], [100, "arguments"], [101, "arguments"], [102, "arguments"], [103, "arguments"], [104, "arguments"], [107, "arguments"], [108, "arguments"], [109, "arguments"], [110, "arguments"]], "Version History": [[21, "version-history"], [22, "version-history"], [23, "version-history"], [24, "version-history"], [25, "version-history"], [26, "version-history"], [27, "version-history"], [28, "version-history"], [29, "version-history"], [30, "version-history"], [31, "version-history"], [32, "version-history"], [33, "version-history"], [34, "version-history"], [35, "version-history"], [36, "version-history"], [37, "version-history"], [38, "version-history"], [40, "version-history"], [41, "version-history"], [42, "version-history"], [43, "version-history"], [44, "version-history"], [45, "version-history"], [46, "version-history"], [47, "version-history"], [48, "version-history"], [49, "version-history"], [50, "version-history"], [51, "version-history"], [52, "version-history"], [53, "version-history"], [54, "version-history"], [55, "version-history"], [56, "version-history"], [57, "version-history"], [58, "version-history"], [59, "version-history"], [60, "version-history"], [61, "version-history"], [62, "version-history"], [63, "version-history"], [64, "version-history"], [65, "version-history"], [66, "version-history"], [67, "version-history"], [68, "version-history"], [69, "version-history"], [70, "version-history"], [71, "version-history"], [72, "version-history"], [73, "version-history"], [74, "version-history"], [75, "version-history"], [76, "version-history"], [77, "version-history"], [78, "version-history"], [79, "version-history"], [80, "version-history"], [81, "version-history"], [82, "version-history"], [84, "version-history"], [85, "version-history"], [86, "version-history"], [88, "version-history"], [90, "version-history"], [91, "version-history"], [92, "version-history"], [94, "version-history"], [95, "version-history"], [96, "version-history"], [97, "version-history"], [98, "version-history"], [99, "version-history"], [100, "version-history"], [101, "version-history"], [102, "version-history"], [103, "version-history"], [104, "version-history"], [107, "version-history"], [108, "version-history"], [109, "version-history"], [110, "version-history"]], "Air Raid": [[22, "air-raid"]], "Alien": [[23, "alien"]], "Amidar": [[24, "amidar"]], "Assault": [[25, "assault"]], "Asterix": [[26, "asterix"]], "Asteroids": [[27, "asteroids"]], "Atlantis": [[28, "atlantis"]], "Bank Heist": [[29, "bank-heist"]], "Battle Zone": [[30, "battle-zone"]], "Beam Rider": [[31, "beam-rider"]], "Berzerk": [[32, "berzerk"]], "Bowling": [[33, "bowling"]], "Boxing": [[34, "boxing"]], "Breakout": [[35, "breakout"]], "Carnival": [[36, "carnival"]], "Centipede": [[37, "centipede"]], "Chopper Command": [[38, "chopper-command"]], "Complete List - Atari": [[39, "complete-list-atari"]], "Crazy Climber": [[40, "crazy-climber"]], "Defender": [[41, "defender"]], "Demon Attack": [[42, "demon-attack"]], "Double Dunk": [[43, "double-dunk"]], "Elevator Action": [[44, "elevator-action"]], "Enduro": [[45, "enduro"]], "FishingDerby": [[46, "fishingderby"]], "Freeway": [[47, "freeway"]], "Frostbite": [[48, "frostbite"]], "Gopher": [[49, "gopher"]], "Gravitar": [[50, "gravitar"]], "Hero": [[51, "hero"]], "IceHockey": [[52, "icehockey"]], "Jamesbond": [[53, "jamesbond"]], "JourneyEscape": [[54, "journeyescape"]], "Kangaroo": [[55, "kangaroo"]], "Krull": [[56, "krull"]], "Kung Fu Master": [[57, "kung-fu-master"]], "Montezuma Revenge": [[58, "montezuma-revenge"]], "Ms Pacman": [[59, "ms-pacman"]], "Name This Game": [[60, "name-this-game"]], "Phoenix": [[61, "phoenix"]], "Pitfall": [[62, "pitfall"]], "Pong": [[63, "pong"]], "Pooyan": [[64, "pooyan"]], "PrivateEye": [[65, "privateeye"]], "Qbert": [[66, "qbert"]], "Riverraid": [[67, "riverraid"]], "Road Runner": [[68, "road-runner"]], "Robot Tank": [[69, "robot-tank"]], "Seaquest": [[70, "seaquest"]], "Skiings": [[71, "skiings"]], "Solaris": [[72, "solaris"]], "SpaceInvaders": [[73, "spaceinvaders"]], "StarGunner": [[74, "stargunner"]], "Tennis": [[75, "tennis"]], "TimePilot": [[76, "timepilot"]], "Tutankham": [[77, "tutankham"]], "Up n\u2019 Down": [[78, "up-n-down"]], "Venture": [[79, "venture"]], "Video Pinball": [[80, "video-pinball"]], "Wizard of Wor": [[81, "wizard-of-wor"]], "Zaxxon": [[82, "zaxxon"]], "Box2D": [[83, "box2d"]], "Bipedal Walker": [[84, "bipedal-walker"]], "Starting State": [[84, "starting-state"], [85, "starting-state"], [86, "starting-state"], [88, "starting-state"], [89, "starting-state"], [90, "starting-state"], [91, "starting-state"], [92, "starting-state"], [94, "starting-state"], [95, "starting-state"], [96, "starting-state"], [97, "starting-state"], [98, "starting-state"], [99, "starting-state"], [100, "starting-state"], [101, "starting-state"], [102, "starting-state"], [103, "starting-state"], [104, "starting-state"]], "Episode Termination": [[84, "episode-termination"], [85, "episode-termination"], [86, "episode-termination"]], "Credits": [[84, "credits"], [85, "credits"], [86, "credits"]], "Car Racing": [[85, "car-racing"]], "Reset Arguments": [[85, "reset-arguments"]], "Lunar Lander": [[86, "lunar-lander"]], "Classic Control": [[87, "classic-control"]], "Acrobot": [[88, "acrobot"]], "Episode End": [[88, "episode-end"], [89, "episode-end"], [90, "episode-end"], [91, "episode-end"], [94, "episode-end"], [95, "episode-end"], [96, "episode-end"], [97, "episode-end"], [98, "episode-end"], [99, "episode-end"], [100, "episode-end"], [101, "episode-end"], [102, "episode-end"], [103, "episode-end"], [104, "episode-end"]], "Cart Pole": [[89, "cart-pole"]], "Mountain Car": [[90, "mountain-car"]], "Transition Dynamics:": [[90, "transition-dynamics"], [91, "transition-dynamics"]], "Reward:": [[90, "reward"]], "Mountain Car Continuous": [[91, "mountain-car-continuous"]], "Reward": [[91, "reward"], [108, "reward"]], "Pendulum": [[92, "pendulum"]], "Episode Truncation": [[92, "episode-truncation"]], "MuJoCo": [[93, "mujoco"]], "Ant": [[94, "ant"]], "Half Cheetah": [[95, "half-cheetah"]], "Hopper": [[96, "hopper"]], "Humanoid": [[97, "humanoid"]], "Humanoid Standup": [[98, "humanoid-standup"]], "Inverted Double Pendulum": [[99, "inverted-double-pendulum"]], "Inverted Pendulum": [[100, "inverted-pendulum"]], "Pusher": [[101, "pusher"]], "Reacher": [[102, "reacher"]], "Swimmer": [[103, "swimmer"]], "Notes": [[103, "notes"]], "Walker2D": [[104, "walker2d"]], "Third-Party Environments": [[105, "third-party-environments"]], "Video Game Environments": [[105, "video-game-environments"]], "ViZDoom": [[105, "vizdoom"]], " flappy-bird-gym: A Flappy Bird environment for OpenAI Gym": [[105, "flappy-bird-gym-a-flappy-bird-environment-for-openai-gym"]], " gym-derk: GPU accelerated MOBA environment": [[105, "gym-derk-gpu-accelerated-moba-environment"]], " MineRL": [[105, "minerl"]], " Procgen": [[105, "procgen"]], " SlimeVolleyGym: A simple environment for single and multi-agent reinforcement learning": [[105, "slimevolleygym-a-simple-environment-for-single-and-multi-agent-reinforcement-learning"]], " stable-retro": [[105, "stable-retro"]], " Unity ML Agents": [[105, "unity-ml-agents"]], "Classic Environments (board, card, etc. games)": [[105, "classic-environments-board-card-etc-games"]], " gym-abalone: A two-player abstract strategy board game": [[105, "gym-abalone-a-two-player-abstract-strategy-board-game"]], " gym-spoof": [[105, "gym-spoof"]], " gym-xiangqi: Xiangqi - The Chinese Chess Game": [[105, "gym-xiangqi-xiangqi-the-chinese-chess-game"]], " RubiksCubeGym": [[105, "rubikscubegym"]], " GymGo": [[105, "gymgo"]], "Robotics Environments": [[105, "robotics-environments"]], " GymFC: A flight control tuning and training framework": [[105, "gymfc-a-flight-control-tuning-and-training-framework"]], " gym-gazebo": [[105, "gym-gazebo"]], " gym-goddard: Goddard\u2019s Rocket Problem": [[105, "gym-goddard-goddard-s-rocket-problem"]], " gym-jiminy: training Robots in Jiminy": [[105, "gym-jiminy-training-robots-in-jiminy"]], " gym-miniworld": [[105, "gym-miniworld"]], " gym-pybullet-drones": [[105, "gym-pybullet-drones"]], " MarsExplorer": [[105, "marsexplorer"]], " panda-gym ": [[105, "panda-gym"]], " PyBullet Robotics Environments": [[105, "pybullet-robotics-environments"]], " robo-gym": [[105, "robo-gym"]], " Offworld-gym": [[105, "offworld-gym"]], "Autonomous Driving and Traffic Control Environments": [[105, "autonomous-driving-and-traffic-control-environments"]], " gym-carla": [[105, "gym-carla"]], " gym-duckietown": [[105, "gym-duckietown"]], " gym-electric-motor": [[105, "gym-electric-motor"]], " highway-env": [[105, "highway-env"]], " LongiControl": [[105, "longicontrol"]], " sumo-rl": [[105, "sumo-rl"]], " CommonRoad-RL": [[105, "commonroad-rl"]], "Multi-Agents": [[105, "multi-agents"]], "PettingZoo": [[105, "pettingzoo"]], "Other Environments": [[105, "other-environments"]], " anomalous_rl_envs": [[105, "anomalous-rl-envs"]], " CARL": [[105, "carl"]], " CompilerGym": [[105, "compilergym"]], " DACBench": [[105, "dacbench"]], " Gridworld": [[105, "gridworld"]], " gym-adserve": [[105, "gym-adserve"]], " gym-algorithmic": [[105, "gym-algorithmic"]], " gym-anytrading": [[105, "gym-anytrading"]], " gym-autokey": [[105, "gym-autokey"]], " gym-ccc": [[105, "gym-ccc"]], " gym-cellular-automata": [[105, "gym-cellular-automata"]], " gym-games": [[105, "gym-games"]], " gym-inventory": [[105, "gym-inventory"]], " gym-maze": [[105, "gym-maze"]], " gym-mtsim": [[105, "gym-mtsim"]], " gym-legacy-toytext": [[105, "gym-legacy-toytext"]], " gym-riverswim": [[105, "gym-riverswim"]], " gym-recsys": [[105, "gym-recsys"]], " gym-sokoban": [[105, "gym-sokoban"]], " math-prog-synth-env": [[105, "math-prog-synth-env"]], " NASGym": [[105, "nasgym"]], " NLPGym: A toolkit to develop RL agents to solve NLP tasks": [[105, "nlpgym-a-toolkit-to-develop-rl-agents-to-solve-nlp-tasks"]], " Obstacle Tower": [[105, "obstacle-tower"]], " openmodelica-microgrid-gym": [[105, "openmodelica-microgrid-gym"]], " osim-rl": [[105, "osim-rl"]], " PGE: Parallel Game Engine": [[105, "pge-parallel-game-engine"]], " QASGym": [[105, "qasgym"]], " safe-control-gym": [[105, "safe-control-gym"]], " VirtualTaobao": [[105, "virtualtaobao"]], " mo-gym": [[105, "mo-gym"]], "ABIDES-Gym": [[105, "abides-gym"]], "gym-saturation": [[105, "gym-saturation"]], "ShinRL": [[105, "shinrl"]], "racing-rl": [[105, "racing-rl"]], "go-explore": [[105, "go-explore"]], "tmrl": [[105, "tmrl"]], "racing_dreamer": [[105, "racing-dreamer"]], "racecar_gym": [[105, "racecar-gym"]], "jiminy": [[105, "jiminy"]], "evogym-design-tool": [[105, "evogym-design-tool"]], "l2r": [[105, "l2r"]], "gym_torcs": [[105, "gym-torcs"]], "mobile-env": [[105, "mobile-env"]], "gym-softrobot": [[105, "gym-softrobot"]], "PyElastica": [[105, "pyelastica"]], "tuxkart-ai": [[105, "tuxkart-ai"]], "ostrichrl": [[105, "ostrichrl"]], "quadruped-gym": [[105, "quadruped-gym"]], "Pogo-Stick-Jumping": [[105, "pogo-stick-jumping"]], "evogym": [[105, "evogym"]], "iGibson": [[105, "igibson"]], "SnakeRL": [[105, "snakerl"]], "starship-landing-gym": [[105, "starship-landing-gym"]], "CompilerGym": [[105, "id1"]], "RaveForce": [[105, "raveforce"]], "gym-line-follower": [[105, "gym-line-follower"]], "DexterousHands": [[105, "dexteroushands"]], "OmniIsaacGymEnvs": [[105, "omniisaacgymenvs"]], "border": [[105, "border"]], "SpaceRobotEnv": [[105, "spacerobotenv"]], "gymnax": [[105, "gymnax"]], "Toy Text": [[106, "toy-text"]], "Blackjack": [[107, "blackjack"]], "Cliff Walking": [[108, "cliff-walking"]], "Frozen Lake": [[109, "frozen-lake"]], "Taxi": [[110, "taxi"]], "Info": [[110, "info"]], "Gymnasium is a standard API for reinforcement learning, and a diverse collection of reference environments": [[111, "gymnasium-is-a-standard-api-for-reinforcement-learning-and-a-diverse-collection-of-reference-environments"]]}, "indexentries": {"env (class in gymnasium)": [[2, "gymnasium.Env"]], "action_space (gymnasium.env attribute)": [[2, "gymnasium.Env.action_space"]], "close() (in module gymnasium.env)": [[2, "gymnasium.Env.close"]], "metadata (gymnasium.env attribute)": [[2, "gymnasium.Env.metadata"]], "np_random (gymnasium.env property)": [[2, "gymnasium.Env.np_random"]], "observation_space (gymnasium.env attribute)": [[2, "gymnasium.Env.observation_space"]], "render() (in module gymnasium.env)": [[2, "gymnasium.Env.render"]], "render_mode (gymnasium.env attribute)": [[2, "gymnasium.Env.render_mode"]], "reset() (in module gymnasium.env)": [[2, "gymnasium.Env.reset"]], "reward_range (gymnasium.env attribute)": [[2, "gymnasium.Env.reward_range"]], "spec (gymnasium.env attribute)": [[2, "gymnasium.Env.spec"]], "step() (in module gymnasium.env)": [[2, "gymnasium.Env.step"]], "unwrapped (gymnasium.env property)": [[2, "gymnasium.Env.unwrapped"]], "make() (in module gymnasium)": [[3, "gymnasium.make"]], "register() (in module gymnasium)": [[3, "gymnasium.register"]], "spec() (in module gymnasium)": [[3, "gymnasium.spec"]], "space (class in gymnasium.spaces)": [[4, "gymnasium.spaces.Space"]], "contains() (in module gymnasium.spaces.space.space)": [[4, "gymnasium.spaces.space.Space.contains"]], "dtype (space property)": [[4, "Space.dtype"]], "from_jsonable() (in module gymnasium.spaces.space.space)": [[4, "gymnasium.spaces.space.Space.from_jsonable"]], "sample() (in module gymnasium.spaces.space.space)": [[4, "gymnasium.spaces.space.Space.sample"]], "seed() (in module gymnasium.spaces.space.space)": [[4, "gymnasium.spaces.space.Space.seed"]], "shape (gymnasium.spaces.space.space property)": [[4, "gymnasium.spaces.space.Space.shape"]], "to_jsonable() (in module gymnasium.spaces.space.space)": [[4, "gymnasium.spaces.space.Space.to_jsonable"]], "dict (class in gymnasium.spaces)": [[5, "gymnasium.spaces.Dict"]], "graph (class in gymnasium.spaces)": [[5, "gymnasium.spaces.Graph"]], "sequence (class in gymnasium.spaces)": [[5, "gymnasium.spaces.Sequence"]], "tuple (class in gymnasium.spaces)": [[5, "gymnasium.spaces.Tuple"]], "sample() (gymnasium.spaces.dict method)": [[5, "gymnasium.spaces.Dict.sample"]], "sample() (gymnasium.spaces.graph method)": [[5, "gymnasium.spaces.Graph.sample"]], "sample() (gymnasium.spaces.sequence method)": [[5, "gymnasium.spaces.Sequence.sample"]], "sample() (gymnasium.spaces.tuple method)": [[5, "gymnasium.spaces.Tuple.sample"]], "seed() (gymnasium.spaces.dict method)": [[5, "gymnasium.spaces.Dict.seed"]], "seed() (gymnasium.spaces.graph method)": [[5, "gymnasium.spaces.Graph.seed"]], "seed() (gymnasium.spaces.sequence method)": [[5, "gymnasium.spaces.Sequence.seed"]], "seed() (gymnasium.spaces.tuple method)": [[5, "gymnasium.spaces.Tuple.seed"]], "box (class in gymnasium.spaces)": [[6, "gymnasium.spaces.Box"]], "discrete (class in gymnasium.spaces)": [[6, "gymnasium.spaces.Discrete"]], "multibinary (class in gymnasium.spaces)": [[6, "gymnasium.spaces.MultiBinary"]], "multidiscrete (class in gymnasium.spaces)": [[6, "gymnasium.spaces.MultiDiscrete"]], "text (class in gymnasium.spaces)": [[6, "gymnasium.spaces.Text"]], "is_bounded() (gymnasium.spaces.box method)": [[6, "gymnasium.spaces.Box.is_bounded"]], "sample() (gymnasium.spaces.box method)": [[6, "gymnasium.spaces.Box.sample"]], "sample() (gymnasium.spaces.discrete method)": [[6, "gymnasium.spaces.Discrete.sample"]], "sample() (gymnasium.spaces.multibinary method)": [[6, "gymnasium.spaces.MultiBinary.sample"]], "sample() (gymnasium.spaces.multidiscrete method)": [[6, "gymnasium.spaces.MultiDiscrete.sample"]], "sample() (gymnasium.spaces.text method)": [[6, "gymnasium.spaces.Text.sample"]], "seed() (gymnasium.spaces.box method)": [[6, "gymnasium.spaces.Box.seed"]], "seed() (gymnasium.spaces.discrete method)": [[6, "gymnasium.spaces.Discrete.seed"]], "seed() (gymnasium.spaces.multibinary method)": [[6, "gymnasium.spaces.MultiBinary.seed"]], "seed() (gymnasium.spaces.multidiscrete method)": [[6, "gymnasium.spaces.MultiDiscrete.seed"]], "seed() (gymnasium.spaces.text method)": [[6, "gymnasium.spaces.Text.seed"]], "flatdim() (in module gymnasium.spaces.utils)": [[7, "gymnasium.spaces.utils.flatdim"]], "flatten() (in module gymnasium.spaces.utils)": [[7, "gymnasium.spaces.utils.flatten"]], "flatten_space() (in module gymnasium.spaces.utils)": [[7, "gymnasium.spaces.utils.flatten_space"]], "unflatten() (in module gymnasium.spaces.utils)": [[7, "gymnasium.spaces.utils.unflatten"]], "batch_space() (in module gymnasium.vector.utils)": [[8, "gymnasium.vector.utils.batch_space"]], "concatenate() (in module gymnasium.vector.utils)": [[8, "gymnasium.vector.utils.concatenate"]], "create_empty_array() (in module gymnasium.vector.utils)": [[8, "gymnasium.vector.utils.create_empty_array"]], "create_shared_memory() (in module gymnasium.vector.utils)": [[8, "gymnasium.vector.utils.create_shared_memory"]], "iterate() (in module gymnasium.vector.utils)": [[8, "gymnasium.vector.utils.iterate"]], "read_from_shared_memory() (in module gymnasium.vector.utils)": [[8, "gymnasium.vector.utils.read_from_shared_memory"]], "write_to_shared_memory() (in module gymnasium.vector.utils)": [[8, "gymnasium.vector.utils.write_to_shared_memory"]], "playplot (class in gymnasium.utils.play)": [[9, "gymnasium.utils.play.PlayPlot"]], "playablegame (class in gymnasium.utils.play)": [[9, "gymnasium.utils.play.PlayableGame"]], "callback() (gymnasium.utils.play.playplot method)": [[9, "gymnasium.utils.play.PlayPlot.callback"]], "capped_cubic_video_schedule() (in module gymnasium.utils.save_video)": [[9, "gymnasium.utils.save_video.capped_cubic_video_schedule"]], "check_env() (in module gymnasium.utils.env_checker)": [[9, "gymnasium.utils.env_checker.check_env"]], "convert_to_done_step_api() (in module gymnasium.utils.step_api_compatibility)": [[9, "gymnasium.utils.step_api_compatibility.convert_to_done_step_api"]], "convert_to_terminated_truncated_step_api() (in module gymnasium.utils.step_api_compatibility)": [[9, "gymnasium.utils.step_api_compatibility.convert_to_terminated_truncated_step_api"]], "np_random() (in module gymnasium.utils.seeding)": [[9, "gymnasium.utils.seeding.np_random"]], "play() (in module gymnasium.utils.play)": [[9, "gymnasium.utils.play.play"]], "process_event() (gymnasium.utils.play.playablegame method)": [[9, "gymnasium.utils.play.PlayableGame.process_event"]], "save_video() (in module gymnasium.utils.save_video)": [[9, "gymnasium.utils.save_video.save_video"]], "step_api_compatibility() (in module gymnasium.utils.step_api_compatibility)": [[9, "gymnasium.utils.step_api_compatibility.step_api_compatibility"]], "asyncvectorenv (class in gymnasium.vector)": [[10, "gymnasium.vector.AsyncVectorEnv"]], "syncvectorenv (class in gymnasium.vector)": [[10, "gymnasium.vector.SyncVectorEnv"]], "vectorenv (class in gymnasium.vector)": [[10, "gymnasium.vector.VectorEnv"]], "action_space": [[10, "action_space"]], "close() (gymnasium.vector.vectorenv method)": [[10, "gymnasium.vector.VectorEnv.close"]], "make() (in module gymnasium.vector)": [[10, "gymnasium.vector.make"]], "observation_space": [[10, "observation_space"]], "reset() (gymnasium.vector.vectorenv method)": [[10, "gymnasium.vector.VectorEnv.reset"]], "single_action_space": [[10, "single_action_space"]], "single_observation_space": [[10, "single_observation_space"]], "step() (gymnasium.vector.vectorenv method)": [[10, "gymnasium.vector.VectorEnv.step"]], "wrapper (class in gymnasium)": [[11, "gymnasium.Wrapper"]], "action_space (gymnasium.wrapper property)": [[11, "gymnasium.Wrapper.action_space"]], "close() (in module gymnasium.wrapper)": [[11, "gymnasium.Wrapper.close"]], "metadata (gymnasium.wrapper property)": [[11, "gymnasium.Wrapper.metadata"]], "np_random (gymnasium.wrapper property)": [[11, "gymnasium.Wrapper.np_random"]], "observation_space (gymnasium.wrapper property)": [[11, "gymnasium.Wrapper.observation_space"]], "reset() (in module gymnasium.wrapper)": [[11, "gymnasium.Wrapper.reset"]], "reward_range (gymnasium.wrapper property)": [[11, "gymnasium.Wrapper.reward_range"]], "spec (gymnasium.wrapper property)": [[11, "gymnasium.Wrapper.spec"]], "step() (in module gymnasium.wrapper)": [[11, "gymnasium.Wrapper.step"]], "unwrapped (gymnasium.wrapper property)": [[11, "gymnasium.Wrapper.unwrapped"]], "actionwrapper (class in gymnasium)": [[12, "gymnasium.ActionWrapper"]], "actionwrapper.action() (in module gymnasium.actionwrapper)": [[12, "gymnasium.ActionWrapper.ActionWrapper.action"]], "clipaction (class in gymnasium.wrappers)": [[12, "gymnasium.wrappers.ClipAction"]], "rescaleaction (class in gymnasium.wrappers)": [[12, "gymnasium.wrappers.RescaleAction"]], "ataripreprocessing (class in gymnasium.wrappers)": [[13, "gymnasium.wrappers.AtariPreprocessing"]], "autoresetwrapper (class in gymnasium.wrappers)": [[13, "gymnasium.wrappers.AutoResetWrapper"]], "envcompatibility (class in gymnasium.wrappers)": [[13, "gymnasium.wrappers.EnvCompatibility"]], "humanrendering (class in gymnasium.wrappers)": [[13, "gymnasium.wrappers.HumanRendering"]], "orderenforcing (class in gymnasium.wrappers)": [[13, "gymnasium.wrappers.OrderEnforcing"]], "passiveenvchecker (class in gymnasium.wrappers)": [[13, "gymnasium.wrappers.PassiveEnvChecker"]], "recordepisodestatistics (class in gymnasium.wrappers)": [[13, "gymnasium.wrappers.RecordEpisodeStatistics"]], "recordvideo (class in gymnasium.wrappers)": [[13, "gymnasium.wrappers.RecordVideo"]], "rendercollection (class in gymnasium.wrappers)": [[13, "gymnasium.wrappers.RenderCollection"]], "stepapicompatibility (class in gymnasium.wrappers)": [[13, "gymnasium.wrappers.StepAPICompatibility"]], "timelimit (class in gymnasium.wrappers)": [[13, "gymnasium.wrappers.TimeLimit"]], "vectorlistinfo (class in gymnasium.wrappers)": [[13, "gymnasium.wrappers.VectorListInfo"]], "filterobservation (class in gymnasium.wrappers)": [[14, "gymnasium.wrappers.FilterObservation"]], "flattenobservation (class in gymnasium.wrappers)": [[14, "gymnasium.wrappers.FlattenObservation"]], "framestack (class in gymnasium.wrappers)": [[14, "gymnasium.wrappers.FrameStack"]], "grayscaleobservation (class in gymnasium.wrappers)": [[14, "gymnasium.wrappers.GrayScaleObservation"]], "normalizeobservation (class in gymnasium.wrappers)": [[14, "gymnasium.wrappers.NormalizeObservation"]], "observationwrapper (class in gymnasium)": [[14, "gymnasium.ObservationWrapper"]], "pixelobservationwrapper (class in gymnasium.wrappers)": [[14, "gymnasium.wrappers.PixelObservationWrapper"]], "resizeobservation (class in gymnasium.wrappers)": [[14, "gymnasium.wrappers.ResizeObservation"]], "timeawareobservation (class in gymnasium.wrappers)": [[14, "gymnasium.wrappers.TimeAwareObservation"]], "transformobservation (class in gymnasium.wrappers)": [[14, "gymnasium.wrappers.TransformObservation"]], "observation() (in module gymnasium.observationwrapper)": [[14, "gymnasium.ObservationWrapper.observation"]], "normalizereward (class in gymnasium.wrappers)": [[15, "gymnasium.wrappers.NormalizeReward"]], "rewardwrapper (class in gymnasium)": [[15, "gymnasium.RewardWrapper"]], "rewardwrapper.reward() (in module gymnasium.rewardwrapper)": [[15, "gymnasium.RewardWrapper.RewardWrapper.reward"]], "transformreward (class in gymnasium.wrappers)": [[15, "gymnasium.wrappers.TransformReward"]]}})