Files
Gymnasium/searchindex.js
2022-10-16 13:56:17 +00:00

1 line
184 KiB
JavaScript

Search.setIndex({"docnames": ["404", "README", "api/env", "api/registry", "api/spaces", "api/spaces/composite", "api/spaces/fundamental", "api/spaces/utils", "api/spaces/vector_utils", "api/utils", "api/vector", "api/wrappers", "api/wrappers/action_wrappers", "api/wrappers/misc_wrappers", "api/wrappers/observation_wrappers", "api/wrappers/reward_wrappers", "content/basic_usage", "content/environment_creation", "content/gym_compatibility", "content/handling_timelimits", "content/vectorising", "environments/atari", "environments/atari/adventure", "environments/atari/air_raid", "environments/atari/alien", "environments/atari/amidar", "environments/atari/assault", "environments/atari/asterix", "environments/atari/asteroids", "environments/atari/atlantis", "environments/atari/bank_heist", "environments/atari/battle_zone", "environments/atari/beam_rider", "environments/atari/berzerk", "environments/atari/bowling", "environments/atari/boxing", "environments/atari/breakout", "environments/atari/carnival", "environments/atari/centipede", "environments/atari/chopper_command", "environments/atari/complete_list", "environments/atari/crazy_climber", "environments/atari/defender", "environments/atari/demon_attack", "environments/atari/double_dunk", "environments/atari/elevator_action", "environments/atari/enduro", "environments/atari/fishing_derby", "environments/atari/freeway", "environments/atari/frostbite", "environments/atari/gopher", "environments/atari/gravitar", "environments/atari/hero", "environments/atari/ice_hockey", "environments/atari/jamesbond", "environments/atari/journey_escape", "environments/atari/kangaroo", "environments/atari/krull", "environments/atari/kung_fu_master", "environments/atari/montezuma_revenge", "environments/atari/ms_pacman", "environments/atari/name_this_game", "environments/atari/phoenix", "environments/atari/pitfall", "environments/atari/pong", "environments/atari/pooyan", "environments/atari/private_eye", "environments/atari/qbert", "environments/atari/riverraid", "environments/atari/road_runner", "environments/atari/robotank", "environments/atari/seaquest", "environments/atari/skiing", "environments/atari/solaris", "environments/atari/space_invaders", "environments/atari/star_gunner", "environments/atari/tennis", "environments/atari/time_pilot", "environments/atari/tutankham", "environments/atari/up_n_down", "environments/atari/venture", "environments/atari/video_pinball", "environments/atari/wizard_of_wor", "environments/atari/zaxxon", "environments/box2d", "environments/box2d/bipedal_walker", "environments/box2d/car_racing", "environments/box2d/lunar_lander", "environments/classic_control", "environments/classic_control/acrobot", "environments/classic_control/cart_pole", "environments/classic_control/mountain_car", "environments/classic_control/mountain_car_continuous", "environments/classic_control/pendulum", "environments/mujoco", "environments/mujoco/ant", "environments/mujoco/half_cheetah", "environments/mujoco/hopper", "environments/mujoco/humanoid", "environments/mujoco/humanoid_standup", "environments/mujoco/inverted_double_pendulum", "environments/mujoco/inverted_pendulum", "environments/mujoco/pusher", "environments/mujoco/reacher", "environments/mujoco/swimmer", "environments/mujoco/walker2d", "environments/third_party_environments", "environments/toy_text", "environments/toy_text/blackjack", "environments/toy_text/cliff_walking", "environments/toy_text/frozen_lake", "environments/toy_text/taxi", "index"], "filenames": ["404.md", "README.md", "api/env.md", "api/registry.md", "api/spaces.md", "api/spaces/composite.md", "api/spaces/fundamental.md", "api/spaces/utils.md", "api/spaces/vector_utils.md", "api/utils.md", "api/vector.md", "api/wrappers.md", "api/wrappers/action_wrappers.md", "api/wrappers/misc_wrappers.md", "api/wrappers/observation_wrappers.md", "api/wrappers/reward_wrappers.md", "content/basic_usage.md", "content/environment_creation.md", "content/gym_compatibility.md", "content/handling_timelimits.md", "content/vectorising.md", "environments/atari.md", "environments/atari/adventure.md", "environments/atari/air_raid.md", "environments/atari/alien.md", "environments/atari/amidar.md", "environments/atari/assault.md", "environments/atari/asterix.md", "environments/atari/asteroids.md", "environments/atari/atlantis.md", "environments/atari/bank_heist.md", "environments/atari/battle_zone.md", "environments/atari/beam_rider.md", "environments/atari/berzerk.md", "environments/atari/bowling.md", "environments/atari/boxing.md", "environments/atari/breakout.md", "environments/atari/carnival.md", "environments/atari/centipede.md", "environments/atari/chopper_command.md", "environments/atari/complete_list.md", "environments/atari/crazy_climber.md", "environments/atari/defender.md", "environments/atari/demon_attack.md", "environments/atari/double_dunk.md", "environments/atari/elevator_action.md", "environments/atari/enduro.md", "environments/atari/fishing_derby.md", "environments/atari/freeway.md", "environments/atari/frostbite.md", "environments/atari/gopher.md", "environments/atari/gravitar.md", "environments/atari/hero.md", "environments/atari/ice_hockey.md", "environments/atari/jamesbond.md", "environments/atari/journey_escape.md", "environments/atari/kangaroo.md", "environments/atari/krull.md", "environments/atari/kung_fu_master.md", "environments/atari/montezuma_revenge.md", "environments/atari/ms_pacman.md", "environments/atari/name_this_game.md", "environments/atari/phoenix.md", "environments/atari/pitfall.md", "environments/atari/pong.md", "environments/atari/pooyan.md", "environments/atari/private_eye.md", "environments/atari/qbert.md", "environments/atari/riverraid.md", "environments/atari/road_runner.md", "environments/atari/robotank.md", "environments/atari/seaquest.md", "environments/atari/skiing.md", "environments/atari/solaris.md", "environments/atari/space_invaders.md", "environments/atari/star_gunner.md", "environments/atari/tennis.md", "environments/atari/time_pilot.md", "environments/atari/tutankham.md", "environments/atari/up_n_down.md", "environments/atari/venture.md", "environments/atari/video_pinball.md", "environments/atari/wizard_of_wor.md", "environments/atari/zaxxon.md", "environments/box2d.md", "environments/box2d/bipedal_walker.md", "environments/box2d/car_racing.md", "environments/box2d/lunar_lander.md", "environments/classic_control.md", "environments/classic_control/acrobot.md", "environments/classic_control/cart_pole.md", "environments/classic_control/mountain_car.md", "environments/classic_control/mountain_car_continuous.md", "environments/classic_control/pendulum.md", "environments/mujoco.md", "environments/mujoco/ant.md", "environments/mujoco/half_cheetah.md", "environments/mujoco/hopper.md", "environments/mujoco/humanoid.md", "environments/mujoco/humanoid_standup.md", "environments/mujoco/inverted_double_pendulum.md", "environments/mujoco/inverted_pendulum.md", "environments/mujoco/pusher.md", "environments/mujoco/reacher.md", "environments/mujoco/swimmer.md", "environments/mujoco/walker2d.md", "environments/third_party_environments.md", "environments/toy_text.md", "environments/toy_text/blackjack.md", "environments/toy_text/cliff_walking.md", "environments/toy_text/frozen_lake.md", "environments/toy_text/taxi.md", "index.md"], "titles": ["404 - Page Not Found", "Gymnasium-docs", "Env", "Registry", "Spaces", "Composite Spaces", "Fundamental Spaces", "Spaces Utils", "Spaces Vector Utils", "Utils", "Vector", "Wrappers", "Action Wrappers", "Misc Wrappers", "Observation Wrappers", "Reward Wrappers", "Basic Usage", "Make your own custom environment", "Compatibility with Gym", "Handling Time Limits", "Vectorizing your environments", "Atari", "Adventure", "Air Raid", "Alien", "Amidar", "Assault", "Asterix", "Asteroids", "Atlantis", "Bank Heist", "Battle Zone", "Beam Rider", "Berzerk", "Bowling", "Boxing", "Breakout", "Carnival", "Centipede", "Chopper Command", "Complete List - Atari", "Crazy Climber", "Defender", "Demon Attack", "Double Dunk", "Elevator Action", "Enduro", "FishingDerby", "Freeway", "Frostbite", "Gopher", "Gravitar", "Hero", "IceHockey", "Jamesbond", "JourneyEscape", "Kangaroo", "Krull", "Kung Fu Master", "Montezuma Revenge", "Ms Pacman", "Name This Game", "Phoenix", "Pitfall", "Pong", "Pooyan", "PrivateEye", "Qbert", "Riverraid", "Road Runner", "Robot Tank", "Seaquest", "Skiings", "Solaris", "SpaceInvaders", "StarGunner", "Tennis", "TimePilot", "Tutankham", "Up n\u2019 Down", "Venture", "Video Pinball", "Wizard of Wor", "Zaxxon", "Box2D", "Bipedal Walker", "Car Racing", "Lunar Lander", "Classic Control", "Acrobot", "Cart Pole", "Mountain Car", "Mountain Car Continuous", "Pendulum", "MuJoCo", "Ant", "Half Cheetah", "Hopper", "Humanoid", "Humanoid Standup", "Inverted Double Pendulum", "Inverted Pendulum", "Pusher", "Reacher", "Swimmer", "Walker2D", "Third-Party Environments", "Toy Text", "Blackjack", "Cliff Walking", "Frozen Lake", "Taxi", "Gymnasium is a standard API for reinforcement learning, and a diverse collection of reference environments"], "terms": {"thi": [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 108, 109, 110, 111], "folder": [1, 9, 13, 102, 103], "contain": [1, 2, 4, 7, 8, 10, 11, 13, 14, 17, 20, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 95, 96, 97, 98, 102, 103, 104, 105, 106, 108, 111], "If": [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 20, 21, 27, 30, 35, 38, 47, 48, 49, 50, 51, 65, 72, 76, 85, 86, 87, 92, 95, 97, 98, 99, 103, 105, 108, 109, 110], "you": [1, 2, 4, 5, 6, 7, 9, 10, 11, 12, 13, 14, 15, 16, 17, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 85, 86, 87, 95, 98, 99, 102, 103, 106], "ar": [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 111], "pleas": [1, 2, 9, 20, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 85, 86, 87, 89, 90, 91, 92, 93, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 108, 109, 110, 111], "pr": [1, 106], "repo": [1, 21, 106], "otherwis": [1, 2, 3, 5, 6, 9, 10, 13, 14, 20, 21, 34, 106], "follow": [1, 3, 4, 9, 11, 12, 13, 15, 16, 17, 19, 20, 21, 34, 44, 46, 47, 48, 49, 50, 51, 76, 89, 90, 91, 92, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 108, 110], "below": [1, 6, 11, 19, 47, 85, 87, 93, 102, 105], "directli": [1, 5, 11, 13, 16, 17, 20, 89, 106], "markdown": 1, "file": [1, 17, 89, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105], "repositori": [1, 11, 94, 106], "fork": [1, 106, 112], "docstr": 1, "": [1, 2, 5, 6, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 21, 41, 47, 48, 49, 50, 51, 53, 54, 57, 58, 59, 64, 65, 67, 84, 85, 86, 87, 88, 89, 91, 92, 93, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 107, 108, 110, 111, 112], "python": [1, 3, 8, 13, 17, 85, 86, 87, 106, 107, 112], "Then": [1, 11, 12, 16, 71, 104], "pip": [1, 17, 21, 84, 88, 94], "instal": [1, 9, 13, 17, 29, 84, 88, 94], "your": [1, 2, 10, 11, 12, 13, 14, 15, 16, 24, 25, 27, 29, 30, 32, 34, 35, 36, 38, 44, 46, 47, 48, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 64, 66, 67, 68, 69, 70, 71, 72, 73, 74, 77, 78, 79, 80, 81, 82, 83, 86, 95, 98, 99], "run": [1, 2, 3, 10, 13, 16, 17, 20, 30, 52, 55, 63, 68, 69, 72, 73, 85, 87, 89, 95, 96, 97, 98, 99, 100, 101, 104, 105, 106], "script": 1, "gen_md": 1, "py": [1, 8, 17, 18, 21, 85, 86, 87, 94, 95, 98, 99, 109], "automat": [1, 2, 3, 10, 11, 13, 17, 20, 106], "gener": [1, 2, 4, 5, 6, 9, 10, 11, 13, 14, 16, 17, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 85, 86, 87, 89, 90, 91, 92, 93, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 108, 109, 110, 111, 112], "For": [1, 2, 6, 7, 9, 11, 13, 14, 16, 17, 18, 20, 21, 22, 24, 25, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 42, 52, 53, 54, 55, 56, 57, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 86, 87, 110, 111], "add": [1, 3, 9, 10, 14, 16, 17, 86, 94, 98, 99, 106, 111], "complet": [1, 11, 13, 16, 19, 21, 41, 54, 66, 67, 86, 87], "ensur": [1, 2, 3, 5, 7, 9, 16, 17], "i": [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 85, 86, 87, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 108, 109, 110, 111], "ha": [1, 2, 4, 6, 7, 9, 11, 13, 14, 15, 16, 17, 19, 20, 21, 51, 71, 85, 86, 87, 88, 94, 95, 96, 97, 98, 99, 102, 103, 104, 105, 106, 108, 110, 112], "properli": [1, 4, 20], "format": [1, 4, 9, 11, 13, 14, 16], "md": [1, 17], "correspond": [1, 2, 3, 16, 17, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 87, 89, 90, 91, 92, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 108, 111], "gif": [1, 89], "_static": 1, "video": [1, 11, 40, 70, 85], "env_typ": 1, "where": [1, 3, 5, 6, 7, 9, 11, 13, 14, 16, 17, 19, 20, 21, 44, 86, 89, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 108, 110, 111], "categori": 1, "e": [1, 2, 4, 6, 7, 8, 10, 11, 13, 14, 16, 17, 20, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 102, 103, 106, 108], "g": [1, 2, 4, 6, 7, 8, 10, 11, 16, 17, 20, 72, 89, 93, 106, 110, 111], "mujoco": [1, 11, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106], "snake_cas": 1, "name": [1, 3, 11, 17, 40, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105], "convent": [1, 2, 21], "altern": [1, 20, 21, 106], "gen_gif": 1, "index": [1, 8, 9, 13, 14, 16, 21, 90, 99, 109], "toctre": 1, "requir": [1, 2, 4, 14, 16, 20, 94, 106], "packag": [1, 13, 106], "r": [1, 6, 13, 15, 70, 89, 93, 111], "txt": 1, "To": [1, 3, 8, 10, 13, 14, 15, 16, 17, 20, 21, 29, 39, 67, 85, 86, 87, 89, 111], "onc": [1, 13, 17, 28, 38, 45, 52, 100, 103, 111], "cd": [1, 17], "make": [1, 2, 5, 9, 11, 12, 13, 14, 15, 16, 18, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 85, 86, 87, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 108, 109, 110, 111, 112], "dirhtml": 1, "_build": 1, "rebuild": [1, 29], "everi": [1, 9, 13, 16, 17, 38, 39, 43, 48, 70, 71, 80, 86, 87, 90, 95, 97, 98, 105, 106], "time": [1, 2, 3, 5, 9, 10, 11, 16, 17, 21, 37, 40, 43, 44, 45, 49, 53, 55, 56, 63, 67, 68, 69, 70, 71, 72, 85, 86, 93, 95, 96, 97, 98, 99, 104, 105, 106, 109], "chang": [1, 2, 8, 9, 10, 11, 13, 14, 15, 17, 18, 21, 49, 57, 67, 86, 89, 90, 91, 92, 93, 94, 102, 103, 106, 111], "made": [1, 16, 102, 103], "sphinx": 1, "autobuild": 1, "b": [1, 6, 102, 103, 111], "class": [2, 4, 5, 6, 9, 10, 11, 12, 13, 14, 15, 16, 17, 20, 94], "The": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 108, 109, 110, 111, 112], "main": [2, 20, 87, 97, 105], "reinforc": [2, 4, 19, 20, 89, 104, 107, 108, 109, 111], "learn": [2, 4, 5, 13, 14, 15, 17, 20, 21, 47, 48, 49, 50, 51, 85, 86, 87, 89, 90, 91, 92, 96, 99, 100, 101, 104, 107, 108, 109, 111], "agent": [2, 4, 11, 13, 14, 16, 17, 19, 20, 21, 45, 54, 85, 86, 87, 91, 95, 96, 97, 98, 99, 100, 101, 104, 105, 109, 110, 111], "encapsul": 2, "an": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 87, 89, 90, 91, 92, 93, 95, 96, 97, 98, 99, 102, 103, 104, 105, 106, 108, 109, 111], "arbitrari": [2, 3, 6, 9, 14, 15, 106], "behind": [2, 65], "scene": [2, 65, 106], "dynam": [2, 21, 36, 47, 48, 49, 50, 51, 89, 93, 94, 100, 106], "through": [2, 3, 4, 10, 16, 19, 21, 36, 52, 55, 58, 59, 63, 72, 73, 98, 99, 106], "step": [2, 3, 10, 11, 12, 13, 14, 15, 19, 20, 21, 85, 87, 89, 90, 93, 106, 109, 111, 112], "reset": [2, 3, 9, 10, 11, 12, 13, 14, 15, 16, 20, 89, 90, 91, 92, 93, 106, 111, 112], "function": [2, 3, 4, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 18, 19, 20, 87, 93, 103, 106, 110, 111, 112], "can": [2, 3, 4, 5, 6, 9, 10, 11, 12, 13, 14, 15, 16, 17, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 108, 110, 111], "partial": 2, "fulli": [2, 106], "observ": [2, 4, 5, 8, 9, 10, 11, 12, 13, 15, 16, 19, 106, 112], "singl": [2, 4, 5, 6, 7, 8, 9, 10, 14, 17, 20, 97, 98, 99, 105], "multi": [2, 6, 94, 98, 99, 102], "see": [2, 4, 9, 10, 16, 17, 18, 20, 21, 22, 25, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 42, 52, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 87, 89, 95, 96, 97, 98, 104, 105, 106], "pettingzoo": 2, "api": [2, 11, 13, 17, 19, 106], "user": [2, 3, 10, 16, 17, 21, 89, 90, 91, 92, 93, 106, 112], "need": [2, 3, 4, 5, 9, 11, 12, 13, 14, 16, 17, 19, 39, 41, 46, 52, 56, 66, 71, 85, 87, 90, 94], "know": [2, 13, 17], "updat": [2, 9, 13, 14, 17, 18, 19, 111], "action": [2, 3, 4, 5, 6, 9, 10, 11, 13, 16, 17, 40, 88, 106, 107, 112], "return": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 85, 95, 96, 97, 98, 99, 100, 102, 103, 104, 105, 106, 109, 111], "next": [2, 8, 41, 43, 45], "reward": [2, 3, 9, 10, 11, 13, 16, 17, 19, 20, 94, 106, 112], "take": [2, 3, 6, 7, 9, 10, 11, 12, 13, 16, 20, 21, 74, 88, 90, 92, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 110, 111], "termin": [2, 3, 9, 10, 11, 13, 15, 16, 17, 18, 20, 89, 90, 91, 92, 95, 97, 98, 99, 100, 101, 102, 103, 105, 109, 112], "truncat": [2, 3, 9, 10, 11, 13, 15, 16, 17, 18, 20, 89, 90, 91, 92, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 112], "due": [2, 19, 110], "latest": 2, "inform": [2, 4, 5, 6, 9, 10, 11, 13, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 85, 86, 87, 89, 90, 91, 92, 93, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 108, 109, 110, 111], "from": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 19, 20, 21, 23, 37, 44, 49, 50, 53, 55, 64, 65, 77, 83, 85, 86, 87, 89, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 109, 110, 111], "about": [2, 9, 14, 16, 17, 19, 20, 66, 89, 95, 98, 99], "metric": [2, 9], "debug": [2, 4, 9, 107], "info": [2, 9, 10, 11, 14, 15, 16, 17, 19, 20, 95, 96, 97, 98, 102, 103, 104, 105, 112], "initi": [2, 3, 5, 6, 10, 11, 12, 13, 14, 15, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 85, 87, 88, 89, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 108, 109, 110, 111], "state": [2, 11, 13, 14, 16, 19, 21, 88, 94, 106, 107, 109, 111], "befor": [2, 3, 9, 10, 11, 12, 13, 14, 15, 16, 17, 29, 41, 55, 66, 73, 74, 86, 95, 96, 97, 98, 99, 100, 101, 103, 104, 105], "call": [2, 3, 7, 9, 10, 11, 12, 13, 14, 16, 17, 20, 21, 34, 53, 102, 103, 108, 110], "first": [2, 9, 10, 11, 13, 14, 16, 17, 20, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 85, 86, 87, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 108, 109, 110, 111], "episod": [2, 3, 9, 11, 14, 16, 17, 19, 20, 109, 111], "render": [2, 10, 11, 14, 16, 21, 84, 85, 95, 96, 97, 98, 99, 100, 101, 104, 105, 106], "help": [2, 4, 16, 24, 56, 59, 102, 106], "visualis": 2, "what": [2, 4, 13, 16, 21, 111], "exampl": [2, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 86, 89, 106, 108, 109, 110], "mode": [2, 10, 11, 13, 17, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83], "human": [2, 5, 11, 16, 17, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 86, 98, 99, 102, 106, 112], "rgb_arrai": [2, 9, 11, 13, 14, 16, 17, 21], "ansi": [2, 17], "text": [2, 4, 5, 7, 106, 108, 109, 110, 111], "close": [2, 6, 9, 10, 11, 16, 41, 66, 95, 97, 98, 103, 105, 112], "import": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 20, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 85, 86, 87, 89, 90, 91, 92, 93, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 108, 109, 110, 111, 112], "when": [2, 4, 5, 7, 8, 9, 10, 11, 13, 14, 15, 16, 17, 19, 20, 21, 24, 37, 41, 42, 43, 45, 47, 48, 49, 50, 51, 53, 54, 68, 69, 70, 71, 74, 86, 87, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 109, 111], "extern": [2, 19, 95, 98, 99], "softwar": [2, 106], "us": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 109, 110, 111], "pygam": [2, 9, 16, 17, 84, 106], "databas": 2, "have": [2, 3, 6, 7, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 24, 27, 29, 30, 34, 36, 38, 39, 41, 42, 47, 48, 49, 50, 51, 52, 55, 56, 57, 61, 63, 65, 71, 73, 84, 85, 86, 89, 95, 96, 97, 98, 99, 101, 102, 104, 105, 106, 108, 111], "understand": [2, 7, 10, 102, 106], "action_spac": [2, 9, 10, 11, 12, 14, 15, 16, 17, 20, 111], "space": [2, 9, 10, 11, 12, 13, 14, 17, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 94, 106, 107, 109, 111], "object": [2, 4, 8, 11, 16, 20, 22, 27, 41, 47, 48, 56, 68, 74, 102, 106], "valid": [2, 3, 4, 6, 8, 10, 11, 12, 13, 16, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83], "all": [2, 5, 6, 10, 11, 13, 16, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 48, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 86, 87, 88, 89, 90, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 109], "should": [2, 4, 6, 9, 10, 13, 14, 16, 17, 20, 102, 103], "within": [2, 4, 12, 14, 18, 59, 63, 87, 88, 100, 101, 106], "observation_spac": [2, 5, 6, 10, 11, 14, 16, 17, 20], "reward_rang": [2, 11, 15], "A": [2, 4, 5, 6, 7, 9, 10, 12, 13, 14, 15, 17, 18, 19, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 85, 86, 89, 90, 92, 95, 96, 97, 98, 99, 100, 102, 103, 104, 105, 110], "tupl": [2, 4, 6, 7, 8, 9, 11, 14, 16, 17, 20, 21, 95, 97, 98, 105, 108, 111], "minimum": [2, 6, 93], "maximum": [2, 3, 6, 9, 13, 16, 17, 70, 71, 87, 89, 93, 100, 106], "possibl": [2, 5, 6, 7, 16, 17, 18, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 87, 89, 90, 91, 92, 96, 98, 100, 101, 104, 105, 106, 109, 110, 111], "over": [2, 8, 13, 15, 16, 20, 24, 30, 53, 63, 68, 96, 98, 108, 110], "default": [2, 3, 4, 5, 6, 9, 10, 11, 13, 14, 16, 17, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 86, 89, 93, 95, 96, 97, 98, 102, 103, 104, 105, 106], "rang": [2, 8, 9, 11, 12, 13, 15, 16, 17, 18, 21, 53, 85, 88, 89, 90, 91, 92, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 112], "set": [2, 5, 6, 10, 11, 12, 13, 14, 16, 17, 19, 20, 21, 22, 23, 24, 25, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 79, 80, 81, 82, 84, 87, 88, 89, 91, 92, 94, 95, 96, 97, 98, 102, 103, 104, 105, 106], "infti": [2, 6], "spec": [2, 10, 11, 13], "metadata": [2, 9, 11, 13, 17, 21], "fp": [2, 9, 17, 21], "np_random": [2, 9, 11, 13, 17], "random": [2, 4, 5, 6, 9, 13, 14, 16, 17, 20, 21, 86, 87, 89, 90, 91, 92, 93, 95, 96, 97, 98, 103, 104, 105, 106, 110, 111], "number": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 13, 14, 16, 17, 18, 20, 21, 23, 24, 25, 26, 27, 28, 29, 32, 33, 34, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 55, 58, 60, 61, 62, 64, 65, 67, 70, 72, 74, 75, 77, 78, 79, 81, 82, 86, 87, 89, 97, 98, 99, 104, 105, 108, 110], "assign": [2, 72, 90, 91, 92, 102, 103], "dure": [2, 5, 6, 10, 11, 13, 17, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 89, 95, 96, 97, 98, 104, 105, 111], "super": [2, 11, 12, 14, 15, 17, 20], "seed": [2, 3, 4, 5, 6, 10, 16, 17, 69, 112], "assess": 2, "self": [2, 4, 5, 11, 12, 13, 14, 15, 17, 20, 92, 106], "modifi": [2, 4, 10, 11, 12, 14, 15, 16, 17, 89, 102, 103, 106, 111], "extend": [2, 106], "wrapper": [2, 3, 5, 6, 9, 10, 18, 20, 102, 103, 106, 112], "acttyp": [2, 9, 11], "obstyp": [2, 9, 11], "float": [2, 3, 7, 9, 11, 12, 14, 15, 17, 20, 21, 52, 65, 87, 95, 96, 97, 98, 104, 105, 106], "bool": [2, 3, 4, 6, 9, 10, 11, 13, 14, 17, 20, 21, 87, 95, 96, 97, 98, 104, 105], "dict": [2, 4, 6, 7, 8, 9, 10, 11, 13, 14, 16, 17, 20], "one": [2, 5, 6, 7, 9, 10, 11, 13, 14, 16, 19, 20, 23, 24, 25, 29, 34, 41, 44, 45, 57, 66, 67, 68, 70, 71, 76, 89, 90, 91, 92, 93, 95, 97, 99, 100, 101, 103, 104, 106, 108, 111], "timestep": [2, 13, 14, 16, 17, 91, 92, 95, 97, 98, 99, 100, 101, 102, 103, 105], "end": [2, 11, 13, 16, 19, 20, 29, 38, 39, 41, 43, 45, 46, 54, 55, 56, 66, 70, 73, 74, 85, 93, 106, 109, 111], "reach": [2, 11, 17, 19, 29, 31, 41, 44, 45, 62, 65, 73, 74, 88, 89, 90, 91, 92, 95, 97, 98, 99, 100, 101, 102, 103, 105, 106, 109, 110, 111], "necessari": [2, 4, 21, 47, 48, 49, 50, 51], "version": [2, 3, 4, 11, 17, 19, 20, 90, 106], "0": [2, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 85, 86, 87, 89, 90, 91, 92, 93, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 108, 109, 110, 111], "26": [2, 16, 17, 18, 19, 95, 98, 99], "wa": [2, 9, 10, 11, 14, 15, 16, 19, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 95, 96, 97, 98, 104, 105, 106], "remov": [2, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 89, 111], "done": [2, 3, 9, 11, 13, 16, 17, 18, 19, 95, 97, 98, 99, 100, 101, 105], "favor": 2, "clearer": 2, "had": 2, "which": [2, 3, 4, 5, 7, 8, 9, 10, 11, 13, 14, 15, 16, 17, 18, 19, 21, 41, 43, 45, 59, 86, 87, 89, 90, 94, 95, 96, 97, 98, 99, 100, 102, 103, 104, 105, 106, 110, 111], "critic": [2, 13], "bootstrap": [2, 19], "algorithm": [2, 4, 19, 20, 94, 107, 111], "paramet": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 20, 87, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 104, 105], "provid": [2, 4, 5, 6, 9, 10, 11, 12, 13, 14, 16, 17, 18, 20, 21, 27, 41, 43, 47, 48, 49, 50, 51, 85, 89, 106], "element": [2, 4, 5, 6, 8, 10, 14, 16, 17, 20, 90, 91, 92, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 110], "numpi": [2, 4, 6, 8, 10, 11, 12, 14, 16, 17, 106, 109], "arrai": [2, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 17, 20, 87, 106], "posit": [2, 5, 6, 7, 8, 9, 13, 14, 16, 17, 20, 21, 32, 53, 85, 86, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 109, 110, 111], "veloc": [2, 5, 7, 8, 16, 20, 85, 87, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105], "pole": [2, 72, 88, 100, 101, 106], "cartpol": [2, 3, 9, 10, 13, 14, 15, 16, 20, 88, 90, 100, 101, 106], "result": [2, 7, 9, 10, 89, 95, 98, 99, 106, 107, 109, 111], "whether": [2, 3, 6, 9, 13, 17, 19, 20, 34, 87, 95, 96, 97, 98, 104, 105, 108], "defin": [2, 4, 7, 11, 12, 13, 14, 15, 16, 17, 19, 20, 93, 98, 112], "under": [2, 14, 15, 106], "mdp": [2, 13, 16, 91, 92], "task": [2, 5, 11, 14, 16, 17, 19, 57, 63, 66, 86, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 109], "neg": [2, 6, 9, 16, 72, 92, 95, 96, 98, 99, 100, 102, 103], "goal": [2, 16, 17, 24, 27, 32, 34, 36, 38, 41, 53, 58, 59, 60, 61, 62, 64, 67, 69, 71, 72, 78, 79, 80, 81, 82, 83, 89, 90, 91, 92, 93, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 108, 109, 110, 111], "move": [2, 11, 15, 17, 19, 23, 26, 27, 36, 37, 51, 54, 65, 68, 71, 72, 85, 87, 90, 95, 96, 97, 99, 100, 101, 102, 103, 104, 105, 106, 109, 110, 111], "lava": [2, 52], "sutton": [2, 89, 90, 100, 101, 108, 109], "barton": 2, "gridworld": [2, 17, 109], "true": [2, 3, 7, 9, 10, 12, 13, 14, 16, 17, 20, 21, 47, 48, 49, 50, 51, 85, 86, 87, 95, 96, 97, 98, 104, 105, 108, 110], "condit": [2, 16, 19], "outsid": [2, 19, 86, 87], "scope": [2, 19], "satisfi": 2, "typic": [2, 9, 106, 111], "timelimit": [2, 3, 11, 13, 16, 17, 19], "could": [2, 9, 14, 15, 17, 19, 21, 106], "also": [2, 3, 6, 9, 10, 11, 13, 14, 16, 17, 19, 21, 33, 54, 55, 66, 67, 69, 85, 86, 87, 88, 94, 95, 96, 97, 98, 104, 105, 106], "indic": [2, 9, 13, 19, 20, 86, 89, 90, 95, 98, 99, 111], "physic": [2, 84, 94, 100, 101, 106], "go": [2, 19, 20, 45, 72, 76, 86, 108], "out": [2, 8, 17, 19, 21, 30, 35, 52, 55, 63, 68, 73], "bound": [2, 6, 11, 12, 16, 19, 87, 89, 90, 91, 92, 93], "prematur": 2, "auxiliari": [2, 17], "diagnost": 2, "log": 2, "might": [2, 4, 6, 7, 11, 12, 13, 14, 15, 16, 17, 20, 106], "instanc": [2, 3, 4, 5, 7, 8, 9, 10, 11, 13, 15, 16, 20, 106], "describ": [2, 5, 16, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 89, 90, 104, 106, 108], "perform": [2, 9, 13, 16, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 103, 106], "variabl": [2, 4, 6, 10, 13, 17, 19, 97, 104, 105, 106], "hidden": [2, 94, 106], "individu": [2, 11, 17, 20, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105], "term": [2, 11, 17, 88, 89, 94, 95, 96, 97, 98, 102, 103, 104, 105], "combin": [2, 4, 9, 11, 16, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 52, 53, 54, 55, 56, 57, 58, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 103], "produc": [2, 11, 13, 16, 17, 99], "total": [2, 41, 85, 86, 87, 95, 96, 97, 98, 99, 100, 102, 103, 104, 105, 111], "In": [2, 6, 9, 10, 11, 12, 14, 16, 17, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 86, 88, 89, 95, 96, 97, 98, 104, 105, 106, 109, 111], "openai": [2, 3, 10, 11, 19, 84, 112], "gym": [2, 3, 4, 5, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 19, 20, 84, 85, 86, 87, 89, 90, 91, 92, 93, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 108, 109, 110, 111, 112], "v26": 2, "distinguish": [2, 17, 19], "howev": [2, 3, 4, 5, 6, 7, 10, 11, 12, 13, 14, 16, 17, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 89, 95, 96, 97, 98, 102, 103, 111], "deprec": [2, 16], "favour": [2, 16], "boolean": [2, 4, 9, 13, 16, 20, 87], "valu": [2, 3, 4, 5, 6, 7, 8, 9, 11, 12, 13, 14, 16, 19, 20, 21, 71, 85, 87, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 108, 110, 111], "case": [2, 4, 5, 6, 11, 12, 14, 16, 17, 19, 20, 54, 66, 86, 95, 96, 97, 98, 104, 105, 111], "further": [2, 71, 87, 102, 103], "undefin": 2, "signal": [2, 11, 13, 16, 17, 19, 95, 97, 98, 105, 111], "mai": [2, 6, 9, 10, 12, 13, 14, 16, 17, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 95, 96, 97, 98, 104, 105, 110], "emit": [2, 11, 13], "differ": [2, 4, 5, 9, 10, 11, 12, 13, 14, 16, 17, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 86, 93, 95, 96, 97, 98, 99, 100, 101, 105, 106], "reason": [2, 87, 106], "mayb": 2, "underli": [2, 11, 13, 16, 89], "solv": [2, 17, 85, 88, 90, 94, 100, 101], "successfulli": 2, "certain": [2, 44, 46, 100, 101, 103], "exceed": [2, 11, 13, 16, 95, 97, 98, 105], "simul": [2, 21, 47, 48, 49, 50, 51, 94, 98, 99, 100, 101, 106], "enter": [2, 9, 16, 28, 30, 57, 87], "invalid": [2, 6], "option": [2, 3, 4, 5, 6, 9, 10, 11, 13, 14, 16, 17, 86, 89, 90, 91, 92, 93], "int": [2, 3, 4, 5, 6, 7, 8, 9, 10, 12, 13, 14, 16, 17, 20, 21], "none": [2, 3, 4, 5, 6, 7, 8, 9, 10, 13, 14, 16, 17, 20, 110], "intern": [2, 10, 14], "new": [2, 4, 11, 12, 13, 14, 16, 17, 18, 19, 20, 25, 28, 30, 43, 89, 90, 91, 92, 93, 103, 106], "start": [2, 4, 6, 9, 10, 13, 16, 20, 31, 44, 45, 51, 55, 56, 71, 106, 108, 109, 110, 111], "often": [2, 4, 17, 94], "some": [2, 4, 5, 6, 10, 11, 13, 14, 15, 16, 17, 20, 21, 37, 45, 63, 86, 88, 89, 94, 103, 104, 106, 111], "explor": [2, 4, 51], "generalis": 2, "polici": [2, 14, 15, 19, 20, 88, 94, 95, 96, 97, 98, 99, 104, 105, 106, 112], "control": [2, 4, 6, 15, 16, 21, 23, 26, 28, 29, 30, 31, 32, 37, 39, 42, 49, 50, 51, 54, 56, 63, 64, 66, 68, 69, 70, 71, 72, 73, 76, 77, 84, 86, 89, 90, 91, 92, 93, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105], "alreadi": [2, 11, 14, 16, 106], "rng": [2, 4, 5, 6, 17], "therefor": [2, 4, 10, 18], "right": [2, 6, 16, 17, 21, 23, 25, 26, 27, 28, 32, 36, 37, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 53, 54, 55, 56, 58, 60, 61, 62, 64, 67, 72, 74, 75, 77, 78, 81, 82, 85, 86, 87, 90, 91, 92, 93, 95, 96, 97, 98, 99, 100, 101, 104, 105, 109, 110, 111], "after": [2, 3, 9, 10, 13, 14, 16, 17, 19, 20, 29, 33, 38, 44, 48, 52, 74, 87, 95, 96, 97, 98, 99, 104, 105, 106, 108, 111], "never": 2, "again": [2, 17, 87], "custom": [2, 4, 9, 10, 14, 16, 21, 47, 48, 49, 50, 51, 104, 106, 110], "line": [2, 17, 44, 89], "correctli": [2, 14, 15, 17], "v0": [2, 3, 10, 11, 13, 16, 17, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 85, 86, 87, 89, 90, 91, 92, 93, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 108, 109, 110, 111], "25": [2, 21, 47, 48, 49, 50, 51, 95, 97, 98, 99, 105, 111], "return_info": 2, "now": [2, 16, 17, 19, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 85, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105], "expect": [2, 4, 5, 6, 10, 13], "prng": [2, 4, 5, 6], "doe": [2, 3, 5, 7, 9, 10, 11, 13, 16, 17, 18, 19, 33, 49, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 108], "pass": [2, 3, 4, 5, 6, 7, 9, 10, 11, 12, 13, 14, 15, 16, 17, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 86, 87, 95, 96, 97, 98, 104, 105], "chosen": [2, 6, 21], "sourc": [2, 17, 94, 106], "entropi": 2, "timestamp": 2, "dev": [2, 20], "urandom": 2, "integ": [2, 5, 6, 9, 13, 14, 17, 21, 111], "even": [2, 3, 17, 20, 22, 24, 30, 31, 33, 35, 38, 39, 42, 52, 53, 54, 56, 57, 59, 63, 66, 68, 69, 70, 71, 73, 76, 80, 83, 99], "exist": [2, 3, 4, 10, 11, 16, 18, 20], "usual": [2, 5, 6, 11, 13, 16, 17, 21, 47, 48, 49, 50, 51, 53, 97], "want": [2, 5, 10, 11, 12, 13, 15, 16, 17, 30, 52], "been": [2, 9, 13, 16, 17, 19, 95, 98, 99, 106], "refer": [2, 9, 13, 16, 17, 19], "minim": [2, 17, 19, 20], "abov": [2, 5, 6, 9, 16, 21, 47, 48, 49, 50, 51, 89, 90, 93, 94], "paradigm": 2, "specifi": [2, 4, 5, 6, 9, 11, 12, 13, 14, 15, 16, 17, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 87, 88, 93, 97, 98, 102, 103, 105, 106, 107, 110, 111], "how": [2, 4, 9, 10, 16, 17, 19, 20, 53, 55, 56, 99, 100, 102, 103, 106], "depend": [2, 5, 9, 14, 15, 21, 23, 24, 25, 26, 27, 28, 29, 32, 33, 34, 36, 37, 39, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 55, 56, 58, 60, 61, 62, 64, 65, 67, 72, 74, 75, 77, 78, 79, 81, 82, 84, 88, 90, 94, 95, 96, 97, 98, 104, 105, 106, 110], "specif": [2, 3, 6, 13, 16, 19, 106], "analog": [2, 21], "dictionari": [2, 4, 5, 9, 10, 11, 13, 14, 16, 17, 20, 111], "complement": 2, "It": [2, 3, 5, 6, 9, 10, 11, 13, 16, 17, 21, 22, 23, 24, 25, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 52, 53, 54, 55, 56, 57, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 79, 80, 81, 82, 85, 94, 95, 96, 97, 98, 99, 102, 103, 104, 105, 106, 109], "union": [2, 3, 4, 5, 6, 7, 8, 9, 10, 12, 14], "renderfram": [2, 9], "list": [2, 4, 5, 6, 9, 10, 11, 14, 16, 20, 21, 106], "comput": [2, 9, 17, 64, 76, 95, 100, 102, 103, 106], "frame": [2, 9, 13, 14, 21, 34, 86, 87, 99, 102, 106], "render_mod": [2, 9, 10, 11, 13, 14, 16, 17, 21, 112], "wai": [2, 5, 11, 16, 19, 20, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 106], "most": [2, 4, 11, 13, 14, 16, 17, 20, 21, 47, 48, 49, 50, 51, 103], "achiev": [2, 21, 24, 89, 108], "appli": [2, 3, 5, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 20, 85, 87, 88, 89, 90, 91, 92, 93, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 108], "collect": [2, 10, 24, 27, 45, 59, 60, 63, 79, 106], "As": [2, 10, 11, 16, 77, 89, 94, 95, 96, 98, 99, 106, 107, 111], "known": [2, 13, 28, 106], "__init__": [2, 5, 8, 11, 12, 14, 15, 17, 20], "initialis": [2, 13], "By": [2, 3, 13, 16, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 89, 95, 96, 97, 98, 104, 105], "continu": [2, 4, 11, 12, 16, 19, 26, 27, 86, 87, 88, 91, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106], "current": [2, 6, 9, 11, 13, 14, 17, 18, 21, 86, 89, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 108, 109, 110, 111], "displai": [2, 17, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 90, 106], "consumpt": 2, "occur": [2, 13, 16, 17, 20, 89, 90], "doesn": [2, 3, 11, 13, 18, 19, 21, 87], "t": [2, 3, 5, 6, 7, 9, 11, 13, 14, 15, 17, 18, 19, 21, 37, 47, 48, 49, 50, 51, 70, 71, 86, 87, 91, 92], "repres": [2, 5, 6, 9, 16, 17, 20, 87, 89, 92, 93, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 110, 111, 112], "np": [2, 4, 5, 6, 8, 9, 10, 12, 13, 14, 15, 16, 17, 20, 87, 111], "ndarrai": [2, 3, 5, 6, 7, 8, 9, 12, 89, 90, 91, 92, 93, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 111], "shape": [2, 4, 5, 6, 7, 8, 11, 12, 13, 14, 16, 17, 85, 86, 87, 89, 90, 91, 92, 93, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105], "x": [2, 4, 6, 7, 17, 87, 90, 91, 92, 93, 95, 96, 97, 98, 99, 100, 102, 103, 104, 105, 106], "y": [2, 6, 21, 87, 93, 95, 96, 98, 99, 100, 102, 103, 104, 111], "3": [2, 5, 6, 7, 8, 9, 10, 13, 14, 16, 17, 18, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 85, 86, 87, 89, 90, 91, 92, 93, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 108, 109, 110, 111], "rgb": [2, 11, 13, 14, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 86, 95, 96, 97, 98, 99, 100, 101, 104, 105], "pixel": [2, 11, 17, 86, 106], "imag": [2, 4, 10, 11, 13, 14, 16, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 86, 106], "string": [2, 4, 6, 9, 14, 20], "str": [2, 3, 4, 5, 6, 7, 9, 10, 13, 14, 21, 95, 96, 97, 98, 104, 105], "stringio": [2, 107], "style": [2, 10, 13, 106], "represent": [2, 19], "each": [2, 3, 4, 5, 6, 9, 10, 11, 12, 14, 16, 17, 20, 21, 41, 43, 44, 45, 46, 49, 57, 64, 66, 67, 68, 69, 70, 71, 72, 84, 85, 87, 88, 89, 90, 91, 92, 95, 98, 99, 100, 101, 102, 106, 107, 109, 111], "includ": [2, 3, 14, 17, 18, 19, 20, 21, 90, 95, 96, 97, 98, 100, 101, 102, 103, 104, 105, 106, 111], "newlin": 2, "escap": [2, 40, 55, 59], "sequenc": [2, 3, 4, 6, 7, 10, 14, 21, 106], "color": [2, 5, 25, 36, 49, 67], "rgb_array_list": [2, 9, 11, 13], "ansi_list": 2, "base": [2, 4, 5, 10, 11, 12, 13, 14, 15, 16, 17, 45, 54, 71, 84, 89, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 111], "except": [2, 16, 17, 68, 71], "rendercollect": [2, 11, 13], "pop": [2, 16, 103], "sure": [2, 13, 16, 17], "kei": [2, 3, 4, 5, 6, 9, 10, 11, 13, 14, 16, 17, 19, 20, 21, 22, 53, 95, 96, 97, 98, 102, 103, 104, 105, 106, 111], "support": [2, 4, 5, 7, 9, 10, 11, 13, 14, 16, 17, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 89, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106], "longer": [2, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 95, 97, 98, 99, 100, 101, 102, 103, 105, 106], "accept": [2, 9, 13, 17, 21], "rather": [2, 86, 106], "v1": [2, 3, 9, 10, 13, 14, 15, 16, 20, 85, 86, 87, 89, 90, 93, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 108, 110, 111], "type": [2, 4, 5, 6, 10, 11, 12, 14, 16, 17, 20, 43, 86, 95, 96, 97, 98, 104, 105, 106], "discret": [2, 4, 5, 7, 8, 10, 12, 14, 16, 17, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 86, 87, 89, 90, 91, 92, 106, 107, 108, 109, 110, 111], "give": [2, 24, 25, 43, 44, 87, 102, 108, 111], "2": [2, 5, 6, 7, 8, 9, 10, 12, 14, 15, 16, 17, 20, 21, 22, 23, 25, 26, 27, 28, 29, 31, 32, 34, 36, 37, 39, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 53, 55, 58, 60, 61, 62, 64, 65, 67, 72, 74, 75, 76, 77, 78, 79, 81, 82, 87, 89, 90, 91, 92, 93, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 108, 109, 110, 111], "mean": [2, 16, 17, 20, 89, 95, 96, 97, 102], "two": [2, 5, 6, 9, 10, 13, 16, 17, 20, 21, 23, 34, 76, 85, 87, 89, 91, 92, 94, 95, 96, 97, 98, 99, 100, 102, 103, 104, 105, 108], "1": [2, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 85, 86, 87, 89, 90, 91, 92, 93, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 108, 109, 110, 111], "box": [2, 4, 5, 7, 8, 10, 11, 12, 14, 16, 17, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 85, 86, 87, 92, 93, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106], "4028234663852886e": 2, "38": [2, 98, 99], "4": [2, 6, 7, 9, 10, 11, 12, 13, 14, 16, 17, 20, 21, 23, 25, 26, 27, 28, 30, 32, 34, 36, 37, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 55, 58, 60, 61, 62, 64, 65, 66, 67, 74, 75, 77, 78, 79, 81, 82, 85, 87, 89, 90, 91, 92, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 109, 110, 111], "float32": [2, 5, 6, 7, 8, 10, 11, 12, 14, 16, 20, 85, 86, 87, 92, 93, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105], "denot": [2, 90], "we": [2, 6, 13, 14, 15, 16, 17, 18, 19, 20, 21, 95, 98, 99, 106], "check": [2, 6, 13, 17, 18, 111], "well": [2, 4, 17, 20, 28, 71, 89, 95, 98, 99, 106], "high": [2, 5, 6, 7, 8, 10, 14, 16, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 85, 86, 87, 89, 90, 91, 92, 93, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106], "8000002e": 2, "00": 2, "4028235e": 2, "1887903e": 2, "01": [2, 15, 87, 95, 96, 99, 100, 101, 102, 103, 104], "dtype": [2, 4, 5, 6, 8, 10, 14, 16, 17, 20, 87], "low": [2, 5, 6, 7, 8, 14, 16, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 85, 86, 87, 89, 90, 91, 92, 93, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106], "ani": [2, 4, 5, 8, 9, 13, 14, 16, 17, 19, 20, 21, 43, 47, 48, 49, 50, 51, 52, 70, 87, 90, 95, 97, 98, 99, 100, 101, 102, 103, 104, 105, 110], "etc": [2, 4, 11, 16, 17, 19, 20, 66, 69, 73, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105], "determin": [2, 6, 17, 19, 21, 87, 89, 90, 91, 92, 93, 106], "inf": [2, 14, 90, 91, 92, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105], "envspec": [2, 3], "normal": [2, 6, 11, 13, 85, 86, 93, 95, 96, 100], "finish": [2, 86, 87], "code": [2, 4, 5, 9, 10, 11, 13, 14, 15, 16, 17, 20, 89, 106], "clean": 2, "up": [2, 5, 6, 10, 14, 16, 17, 21, 22, 24, 25, 26, 27, 28, 30, 31, 32, 34, 37, 40, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 54, 55, 58, 60, 65, 67, 68, 69, 71, 72, 75, 76, 77, 78, 81, 82, 85, 87, 94, 95, 98, 99, 103, 108, 109, 110, 111], "window": [2, 9, 16, 17, 41, 86, 106], "http": [2, 9, 11, 17, 21, 86, 89, 106, 108, 109], "connect": [2, 5, 89, 95, 96, 97, 103, 104, 105], "properti": [2, 4, 11, 19, 20], "unwrap": [2, 11, 16, 89], "non": [2, 4, 7, 9, 17, 19], "wrap": [2, 3, 9, 10, 11, 12, 13, 14, 15, 16, 17, 20], "_np_random": 2, "meth": [2, 18], "much": [2, 17, 19, 21, 47, 48, 49, 50, 51, 55, 56, 99], "creat": [2, 3, 6, 8, 9, 10, 13, 16, 31, 85, 86, 87, 102, 103, 106, 107], "more": [2, 4, 5, 6, 9, 10, 11, 14, 16, 17, 19, 20, 21, 22, 25, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 42, 47, 52, 53, 54, 55, 56, 57, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 85, 87, 94, 95, 98, 99, 100, 101, 102, 103, 104, 106], "creation": [2, 10, 17], "tutori": 2, "gymnasium": [3, 4, 5, 6, 7, 8, 9, 12, 13, 14, 15, 16, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 108, 109, 110, 111], "allow": [3, 4, 5, 9, 11, 12, 14, 15, 16, 17, 21, 52, 70, 89, 90, 91, 92, 93, 100, 101, 102, 103], "load": 3, "pre": 3, "sever": [3, 6, 11, 13, 21, 51, 106], "id": [3, 10, 16, 17, 18, 110], "kwarg": [3, 9, 10, 11, 17, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105], "env": [3, 9, 11, 12, 13, 14, 15, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 85, 86, 87, 89, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 109, 110, 111, 112], "liter": 3, "mountaincar": [3, 20, 91], "mountaincarcontinu": [3, 92], "supportsfloat": [3, 6, 11], "pendulum": [3, 10, 14, 20, 88, 89, 90, 94], "acrobot": [3, 88, 106], "lunarland": [3, 13, 16, 87, 106, 112], "v2": [3, 12, 13, 16, 85, 86, 87, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 111, 112], "lunarlandercontinu": [3, 12], "bipedalwalk": [3, 11, 12, 16, 85], "v3": [3, 11, 12, 16, 85, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 111], "bipedalwalkerhardcor": 3, "carrac": [3, 9, 14, 86], "blackjack": [3, 107], "frozenlak": [3, 9, 20, 110], "frozenlake8x8": 3, "cliffwalk": [3, 109], "taxi": [3, 107], "reacher": [3, 11, 94, 102], "v4": [3, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105], "pusher": 3, "invertedpendulum": [3, 94, 100, 101], "inverteddoublependulum": [3, 100], "halfcheetah": [3, 94, 96], "hopper": [3, 94, 105], "swimmer": [3, 94], "walker2d": [3, 94], "ant": [3, 94, 97, 105], "humanoidstandup": [3, 94, 99], "humanoid": [3, 42, 94, 95], "accord": [3, 5, 6, 10, 87], "given": [3, 6, 11, 14, 19, 20, 68, 71, 85, 87, 88, 89, 91, 92, 95, 97, 98, 105], "find": [3, 17, 21, 22, 47, 48, 49, 50, 51, 57, 66, 78, 100, 103, 106], "avail": [3, 16, 17, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 87, 106], "modul": [3, 8, 17], "eg": [3, 9, 17, 106], "max_episode_step": [3, 13, 17], "length": [3, 5, 6, 9, 11, 13, 14, 20, 85, 89, 90, 91, 92, 96, 104, 106], "autoreset": [3, 10, 17], "autoresetwrapp": [3, 11, 13, 17], "apply_api_compat": [3, 13, 16, 18], "stepapicompat": [3, 11, 13, 16, 18], "convert": [3, 4, 5, 11, 13, 14, 18, 86, 106], "argument": [3, 4, 5, 6, 7, 9, 10, 14, 16, 17, 84, 88, 107], "fals": [3, 9, 10, 13, 14, 16, 17, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 86, 87, 95, 96, 97, 98, 104, 105, 108, 110], "disable_env_check": [3, 10], "checker": [3, 10], "addit": [3, 4, 10, 11, 13, 17, 21, 27, 38, 68, 72, 87, 88, 89, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 108, 111], "constructor": [3, 4, 5, 6, 9, 11, 16, 17], "rais": [3, 6, 7, 8, 9, 10, 13, 14, 20, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105], "error": [3, 6, 9, 11, 13, 19, 20], "entry_point": [3, 17], "callabl": [3, 8, 9, 10, 13, 14, 15, 20], "reward_threshold": [3, 17, 95, 96, 97, 98, 99, 102, 103, 104, 105], "nondeterminist": [3, 17], "order_enforc": [3, 17], "syntax": 3, "namespac": [3, 17, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83], "env_nam": 3, "v": [3, 6, 70, 100], "keyword": [3, 5, 10, 14, 17, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 108], "entri": 3, "point": [3, 7, 9, 11, 16, 19, 21, 24, 25, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 42, 43, 44, 45, 46, 48, 52, 53, 56, 63, 64, 65, 66, 67, 68, 69, 71, 73, 74, 75, 77, 78, 81, 85, 86, 87, 89, 90, 93, 103, 106, 108], "threshold": [3, 17, 89, 90, 111], "consid": [3, 14, 17, 86, 87, 88, 94, 95, 97, 98, 105, 106], "learnt": 3, "knowledg": 3, "limit": [3, 16, 37, 45, 52, 53, 66, 71, 100, 101], "enabl": [3, 11, 20, 21, 86, 106], "order": [3, 4, 5, 11, 16, 17, 20, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 94, 95, 96, 97, 98, 99, 100, 101, 102, 105, 106], "enforc": 3, "correct": [3, 17, 19, 111], "disabl": [3, 13], "recommend": [3, 10, 13, 17, 21, 47, 48, 49, 50, 51, 87, 95, 98, 99, 106], "onli": [3, 4, 5, 6, 7, 10, 11, 12, 13, 14, 16, 17, 20, 21, 23, 25, 26, 27, 28, 29, 32, 34, 36, 37, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 53, 55, 58, 60, 61, 62, 64, 65, 67, 68, 69, 70, 71, 72, 74, 75, 77, 78, 79, 81, 82, 91, 92, 95, 96, 97, 98, 100, 102, 103, 105, 106], "env_id": 3, "retriev": [3, 13, 42, 45, 71], "global": 3, "superclass": [4, 12, 14, 15], "crucial": 4, "thei": [4, 10, 13, 14, 17, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 103, 107, 108], "serv": [4, 95, 96, 97, 98, 104, 105], "variou": [4, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 99, 106], "purpos": [4, 106], "clearli": 4, "interact": [4, 9, 17, 21, 106], "environ": [4, 6, 8, 11, 12, 14, 15, 19, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 107, 108, 109, 110, 111], "look": [4, 9, 11, 13, 15, 16, 17, 19, 21, 23, 25, 26, 27, 28, 29, 32, 34, 36, 37, 41, 43, 44, 45, 46, 55, 58, 60, 61, 62, 64, 65, 67, 70, 72, 74, 75, 77, 78, 79, 81, 82], "like": [4, 6, 9, 11, 12, 13, 14, 15, 16, 17, 20, 23, 24, 25, 26, 27, 28, 29, 30, 32, 34, 36, 37, 41, 43, 44, 45, 46, 55, 58, 60, 61, 62, 63, 64, 65, 66, 67, 72, 74, 75, 77, 78, 79, 81, 82, 85, 87, 95, 96, 98, 99, 101, 102, 103, 105, 106], "u": [4, 6, 11, 15, 17, 21, 106, 107], "work": [4, 9, 11, 13, 14, 21, 86, 87, 89, 96, 97, 100, 101, 105, 106], "highli": [4, 17, 21, 84, 88], "structur": [4, 5, 7, 17, 20, 106], "data": [4, 7, 9, 11, 16, 17, 20], "form": [4, 5, 6, 13, 17, 20, 89, 104], "painlessli": 4, "transform": [4, 7, 9, 11, 12, 13, 16, 103], "them": [4, 11, 13, 16, 21, 23, 24, 25, 28, 29, 33, 37, 44, 65, 74, 87, 96, 103, 106], "flat": [4, 5, 6, 7, 14], "sampl": [4, 5, 6, 7, 8, 9, 10, 14, 15, 16, 17, 20, 87, 111], "especi": [4, 15, 17, 20], "hierarch": [4, 111], "via": [4, 5, 11, 13, 14, 15, 16, 17, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 88, 94, 106, 107], "build": [4, 11, 23, 41, 45, 100, 105, 106], "express": [4, 9, 95, 98, 99], "inherit": [4, 11, 12, 14, 15, 16, 17, 20], "cover": [4, 20], "note": [4, 8, 13, 16, 19, 20, 89, 90, 95, 98, 99, 111], "parametr": 4, "probabl": [4, 19, 21, 110, 111], "distribut": [4, 5, 6, 104], "batch": [4, 8, 10, 20], "vectorenv": [4, 20], "moreov": [4, 13, 17, 20, 21, 24, 34], "implement": [4, 5, 10, 12, 13, 14, 15, 16, 17, 18, 20, 21, 93, 100, 106, 107, 109], "handl": [4, 10, 16, 100], "care": [4, 20, 72], "immut": 4, "mask": [4, 5, 6, 20, 106, 111], "t_cov": 4, "randomli": [4, 5, 17, 87], "uniform": [4, 6, 20, 91, 92, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105], "bounded": 4, "int8": [4, 6], "member": [4, 55], "possibli": [4, 5, 6, 8, 11, 13, 16, 106], "subspac": [4, 5, 6, 7], "to_json": 4, "sample_n": 4, "jsonabl": 4, "from_json": 4, "complex": [4, 5, 98, 99, 100, 101, 106], "matric": 4, "multidiscret": [4, 5, 7, 8, 10, 16, 17, 20], "binari": [4, 6, 16, 17, 20], "hold": [4, 108], "down": [4, 6, 17, 19, 20, 21, 25, 27, 28, 34, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 54, 55, 58, 60, 62, 63, 65, 67, 75, 77, 78, 81, 82, 86, 99, 108, 109, 110], "button": [4, 6, 9], "multibinari": [4, 5, 7, 8, 16], "multipl": [4, 5, 6, 8, 10, 16, 20, 106], "ax": [4, 6, 17], "messag": [4, 106], "mission": [4, 54, 56, 57], "detail": [4, 9, 13, 16, 17, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 89, 106], "join": 4, "togeth": [4, 20, 21, 94], "vectoris": 4, "separ": [4, 5, 16, 17], "readabl": [4, 5], "fix": [4, 5, 6, 11, 13, 15, 16, 17, 54, 89, 90, 93, 94, 95, 96, 97, 98, 100, 101, 105, 110, 111], "unord": 4, "entiti": 4, "select": [4, 6, 44, 95, 98, 99, 102, 103, 106], "graph": [4, 7], "node": [4, 5, 7], "edg": [4, 5, 7, 90], "flatten": [4, 7, 11, 17, 94, 109], "unflatten": [4, 7], "neural": [4, 7, 20, 89, 104, 106], "network": [4, 7, 20, 104, 106], "flatdim": [4, 7, 20], "dimens": [4, 6, 7, 14, 20, 95, 96, 97, 98, 104, 105, 106], "flatten_spac": [4, 7], "revers": [4, 7, 108], "size": [4, 13, 17, 20, 110], "batch_spac": [4, 8], "concaten": [4, 7, 8, 94], "iter": [4, 5, 8, 10], "create_empty_arrai": [4, 8], "create_shared_memori": [4, 8], "read_from_shared_memori": [4, 8], "write_to_shared_memori": [4, 8], "spaces_kwarg": 5, "constitu": 5, "usag": [5, 6, 7, 11, 86], "ordereddict": [5, 8, 14, 16], "nest": [5, 8, 20, 106], "ext_control": 5, "5": [5, 6, 7, 8, 12, 13, 16, 17, 20, 21, 23, 25, 26, 27, 28, 31, 32, 34, 37, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 55, 58, 60, 61, 62, 64, 65, 67, 74, 75, 77, 78, 79, 81, 82, 85, 86, 87, 89, 91, 95, 96, 97, 98, 99, 100, 102, 103, 104, 105, 106, 108, 111], "inner_st": 5, "charg": 5, "100": [5, 7, 13, 20, 35, 45, 68, 69, 85, 86, 87, 89, 92, 97, 102, 106, 109], "system_check": 5, "10": [5, 6, 12, 17, 21, 28, 34, 47, 48, 49, 50, 51, 58, 65, 68, 71, 85, 87, 93, 95, 96, 97, 98, 99, 100, 102, 103, 104, 105, 106, 108, 109, 111], "job_statu": 5, "progress": [5, 16, 77], "conveni": [5, 11, 16, 17, 20], "easili": [5, 11, 16, 106], "flattenobserv": [5, 11, 14, 17], "similar": [5, 17, 20, 25, 36, 102], "deal": 5, "instanti": [5, 9, 13, 14, 15, 17, 20, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83], "either": [5, 6, 7, 9, 13, 20, 21, 44, 54, 91, 92, 108, 110], "avoid": [5, 8, 11, 16, 20, 21, 24, 25, 27, 32, 33, 41, 43, 59, 60, 62, 67, 69, 70, 75], "independ": [5, 6, 10, 20, 97, 103, 104, 105], "same": [5, 7, 9, 10, 14, 16, 19, 20, 53, 85, 86, 89, 102, 103, 104, 111], "attr": 5, "warn": [5, 9, 10, 13, 16], "guarante": [5, 21], "uniqu": [5, 84, 88, 94, 100], "sub": [5, 10, 71], "precis": 5, "cartesian": [5, 6, 93], "product": [5, 6], "03633198": 5, "42370757": 5, "involv": [5, 17, 84, 100, 101, 106, 110], "reproduc": [5, 16], "insid": [5, 6, 13, 17, 20], "method": [5, 9, 12, 13, 14, 15, 16, 17, 18, 20, 106, 111], "draw": [5, 17, 108], "42": [5, 6, 16, 90, 98, 99, 112], "54": 5, "finit": [5, 6, 12, 19, 95, 99, 100, 101, 102, 103, 105], "a_0": 5, "dot": [5, 6, 17, 20], "a_n": 5, "a_i": 5, "belong": [5, 8, 106], "n": [5, 6, 7, 8, 16, 20, 21, 40, 86, 89, 93, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106], "0259352": 5, "80977976": 5, "80066574": 5, "77165383": 5, "must": [5, 7, 8, 9, 10, 11, 12, 13, 14, 16, 17, 19, 20, 21, 22, 23, 26, 28, 29, 30, 31, 33, 37, 38, 39, 42, 45, 46, 55, 59, 61, 62, 67, 86, 97, 105, 106], "length_mask": 5, "sample_mask": 5, "drawn": [5, 6, 102, 104], "geometr": 5, "second": [5, 9, 10, 16, 34, 65, 72, 87, 96, 100, 103, 104, 106], "featur": [5, 6, 106], "feature_spac": 5, "node_spac": [5, 7], "edge_spac": [5, 7], "seri": [5, 16], "adjac": 5, "matrix": [5, 109], "edge_link": [5, 7], "num_nod": 5, "num_edg": 5, "graphinst": [5, 7], "between": [5, 6, 13, 17, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 87, 89, 90, 93, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106], "don": [5, 11, 17, 19, 21, 37, 47, 48, 49, 50, 51, 71, 86, 91], "edge_mask": 5, "multipli": [5, 92], "attribut": [5, 16, 17, 102, 103], "_gener": 6, "unbound": 6, "mathbb": 6, "interv": [6, 16, 95, 97, 98, 105], "There": [6, 11, 16, 17, 53, 54, 66, 85, 86, 87, 88, 91, 92, 94, 99, 100, 101, 102, 103, 106, 108, 109, 111], "common": [6, 11, 14, 16, 19], "ident": [6, 10, 14, 20], "lower": [6, 16, 95, 96, 97, 98, 99, 102, 103, 104, 105], "upper": [6, 16, 98, 99], "construct": [6, 21, 47, 48, 49, 50, 51, 89, 95, 96, 97, 98, 104, 105], "scalar": [6, 12], "respect": [6, 10, 11, 13, 16, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 87, 89, 95, 98, 99, 104], "assum": [6, 14, 17], "across": [6, 8, 27, 37, 48, 49, 52], "infer": [6, 94], "essenti": 6, "valueerror": [6, 7, 8, 10, 13, 14, 20], "coordin": [6, 11, 14, 85, 87, 93, 95, 96, 97, 98, 99, 100, 102, 103, 104, 105, 106], "shift": [6, 16], "exponenti": [6, 11, 15], "unsupport": 6, "is_bound": 6, "manner": [6, 11, 14, 53], "both": [6, 10, 13, 14, 16, 17, 18, 19, 85, 88, 89, 103, 105, 106, 108, 110, 111], "sens": [6, 106], "One": [6, 16, 95, 98, 99, 106], "neither": [6, 13, 108], "nor": [6, 13, 108, 109], "consist": [6, 11, 14, 16, 17, 21, 34, 85, 89, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 108], "mani": [6, 13, 14, 16, 17, 21, 27, 30, 34, 53, 56, 71, 81, 106], "subset": [6, 12, 17, 21, 47, 48, 49, 50, 51], "smallest": 6, "uniformli": [6, 17, 21, 89, 90, 102, 103], "infeas": 6, "sort": 6, "fair": 6, "coin": [6, 106], "toss": 6, "per": [6, 10, 19, 20, 34, 53, 76, 106, 111], "nvec": 6, "int64": [6, 7], "game": [6, 9, 13, 17, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 60, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 84, 108], "keyboard": [6, 9, 16], "alwai": [6, 7, 13, 17, 21, 87, 91, 92, 95, 98, 99, 102, 104, 110, 111], "noop": [6, 9, 13, 21, 23, 25, 26, 27, 28, 29, 32, 34, 36, 37, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 55, 58, 60, 61, 62, 64, 65, 67, 72, 74, 75, 77, 78, 79, 81, 82], "nintendo": 6, "conceptu": 6, "arrow": [6, 16, 65], "left": [6, 16, 17, 21, 23, 25, 26, 27, 28, 32, 36, 37, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 53, 54, 55, 58, 60, 61, 62, 64, 67, 71, 72, 74, 75, 77, 78, 81, 82, 85, 86, 87, 90, 91, 95, 98, 99, 100, 101, 105, 109, 110], "param": 6, "min": [6, 12, 89, 90, 91, 92, 93, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105], "max": [6, 12, 13, 89, 90, 91, 92, 93, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105], "press": [6, 9, 16, 86, 89], "although": 6, "rare": 6, "d": [6, 9, 89, 102, 103], "categor": 6, "vector": [6, 9, 11, 85, 87, 99, 100, 101, 102, 103, 110], "count": [6, 85, 87, 108], "complic": [6, 11, 16], "kind": 6, "unless": [6, 11, 17, 111], "max_length": 6, "min_length": 6, "charset": 6, "frozenset": 6, "6": [6, 7, 21, 25, 26, 27, 28, 32, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 55, 58, 60, 62, 76, 77, 78, 81, 82, 89, 91, 92, 95, 96, 97, 98, 99, 100, 102, 103, 104, 105, 109, 111], "7": [6, 9, 20, 21, 25, 27, 28, 32, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 55, 58, 60, 62, 77, 78, 81, 82, 95, 96, 97, 98, 99, 100, 102, 103, 104, 105], "8": [6, 9, 10, 18, 20, 21, 23, 25, 27, 28, 30, 32, 36, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 55, 58, 60, 61, 77, 81, 82, 86, 87, 89, 90, 93, 95, 96, 97, 98, 99, 100, 102, 103, 104, 105, 110], "9": [6, 8, 10, 20, 21, 25, 28, 33, 42, 47, 48, 49, 50, 51, 55, 58, 68, 77, 82, 89, 93, 95, 96, 97, 98, 99, 100, 102, 103, 105, 108], "c": [6, 20, 70, 87, 89, 106], "f": [6, 14, 15, 110], "h": [6, 110], "j": [6, 21], "k": [6, 7, 9, 13, 87, 104], "l": [6, 13, 104], "m": [6, 7, 17, 20, 21, 40, 89, 91, 92, 93, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105], "o": [6, 20], "p": [6, 96, 110, 111], "q": [6, 19, 67, 111], "w": [6, 9, 16, 95, 98, 99], "z": [6, 95, 96, 97, 98, 99, 102, 103, 105], "compris": 6, "charact": [6, 9, 55, 66], "b5": 6, "hello": 6, "0123456789": 6, "digit": [6, 106], "inclus": [6, 21], "prevent": [6, 10, 44, 106], "empti": [6, 8, 13, 71], "english": 6, "alphabet": 6, "plu": [6, 37, 109], "latin": 6, "charlist": 6, "zero": [6, 8, 17, 19, 20, 93, 96, 106], "matter": 6, "equival": [7, 20, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83], "would": [7, 12, 14, 15, 16, 17, 95, 96, 97, 98, 99, 104, 105], "notimplementederror": 7, "cannot": [7, 8, 13, 17, 19, 109], "attempt": [7, 20, 87, 99, 100], "compound": 7, "func": 7, "oper": [7, 13, 20], "itself": [7, 10, 11, 13, 16], "boundari": 7, "while": [7, 17, 19, 20, 21, 24, 25, 41, 56, 59, 60, 61, 62, 65, 67, 69, 71, 75, 78, 80, 87, 89, 90, 93, 95, 96, 98, 99, 102, 103, 104, 106, 108], "being": [7, 13, 16, 42, 91, 92, 93, 95, 98, 99, 103, 106, 111], "exactli": [7, 104], "origin": [7, 10, 12, 13, 14, 86, 89, 100, 102, 103, 106], "effect": [7, 8, 11, 13, 14, 16, 21, 47, 48, 49, 50, 51, 87, 100, 101, 111], "flattenend": 7, "60": [7, 55, 68, 106], "recurs": 7, "12": [7, 21, 28, 30, 34, 36, 47, 48, 49, 50, 51, 55, 58, 70, 87, 89, 90, 95, 96, 97, 98, 99, 102, 105], "hot": 7, "match": [7, 10, 12, 76], "copi": [8, 10, 17, 20, 106], "item": [8, 9, 106], "_": [8, 9, 10, 11, 16, 112], "6348213": 8, "28607962": 8, "60760117": 8, "87383074": 8, "192658": 8, "2148103": 8, "output": [8, 9, 13, 16], "99644893": 8, "08304597": 8, "7238421": 8, "35848552": 8, "1533453": 8, "67958736": 8, "49076623": 8, "38661423": 8, "7975036": 8, "93317133": 8, "stopiter": 8, "fn": 8, "built": [8, 106], "multi_binari": 8, "multi_discret": 8, "ctx": 8, "multiprocess": [8, 10, 20], "opt": 8, "hostedtoolcach": 8, "14": [8, 21, 47, 48, 49, 50, 51, 55, 85, 87, 95, 96, 98, 99, 102, 105], "x64": 8, "lib": [8, 109], "python3": 8, "process": [8, 9, 10, 14, 17, 19, 20, 89, 102], "eventu": 8, "shared_memori": [8, 10, 20], "customspaceerror": 8, "read": [8, 20, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 85, 86, 87, 89, 90, 91, 92, 93, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 108, 109, 110, 111], "forward": [8, 32, 54, 85, 95, 96, 97, 98, 99, 104, 105], "vice": [8, 13], "versa": [8, 13], "side": [8, 14, 23, 36, 51, 53, 87], "write": [8, 10, 17, 20], "num_env": [8, 10, 20], "plai": [9, 17, 31, 44, 57, 76, 81, 86, 106, 108], "transpos": [9, 17], "zoom": 9, "callback": [9, 16], "keys_to_act": [9, 16], "dw": 9, "so": [9, 10, 11, 13, 14, 16, 17, 19, 20, 21, 49, 72, 87, 88, 95, 96, 97, 98, 99, 100, 101, 104, 105, 106], "particularli": [9, 13, 20, 90], "verifi": 9, "level": [9, 21, 28, 45, 67, 75, 106], "preprocess": [9, 11], "unplay": 9, "wish": [9, 14, 16], "plot": [9, 16], "real": [9, 16, 53, 96, 106], "statist": [9, 16], "playplot": [9, 16], "here": [9, 16, 17, 89], "last": [9, 13, 16, 17, 19, 20, 43, 44, 54, 96, 99, 102, 103], "150": 9, "def": [9, 11, 12, 14, 15, 16, 17, 20], "obs_t": [9, 16], "obs_tp1": [9, 16], "rew": [9, 16, 19], "plotter": [9, 16], "execut": [9, 12, 17, 20, 21, 44, 106, 111], "render_fp": [9, 13, 17], "30": [9, 13, 16, 21, 65, 68, 98, 99], "amount": [9, 41, 43, 44, 46, 52, 71, 85, 90, 100, 101], "input": [9, 10, 16, 20], "receiv": [9, 10, 16, 19, 20, 31, 34, 38, 41, 42, 48, 54, 57, 86, 87, 92, 105], "map": [9, 14, 16, 17, 39, 110, 111], "unicod": 9, "suppos": [9, 16], "trigger": [9, 111], "key_to_act": [9, 16], "ord": [9, 16, 17], "unknown": [9, 106], "horizon_timestep": 9, "plot_nam": 9, "live": [9, 24, 27, 30, 31, 33, 36, 41, 42, 45, 52, 56, 57, 63, 69, 74], "transit": [9, 16, 19, 21, 47, 48, 49, 50, 51, 98, 99, 111], "compute_metr": 9, "obs_tp": 9, "cumulative_reward": 9, "linalg": [9, 17], "norm": [9, 17, 102, 103], "its": [9, 10, 12, 13, 36, 43, 66, 78, 83, 87, 93, 94, 104, 106], "along": [9, 11, 16, 20, 55, 56, 58, 69, 86, 90, 91, 92, 96, 100, 101, 104], "conjunct": 9, "evolv": 9, "200": [9, 46, 69, 87, 89, 90, 91, 93], "immedi": [9, 11, 15, 17, 108], "cumul": [9, 11, 13], "magnitud": [9, 87, 92, 100, 101], "your_env": 9, "len": [9, 12], "horizon": [9, 19, 71, 97, 105], "titl": [9, 91, 92], "dependencynotinstal": [9, 13], "matplotlib": 9, "playablegam": 9, "process_ev": 9, "event": [9, 17, 106], "particular": [9, 11, 14, 18, 19, 20, 87], "keep": [9, 11, 13, 17, 29, 42, 61, 64, 72, 73, 81, 90, 99], "track": [9, 11, 13, 73, 86, 90, 95, 96, 97, 98, 99, 100, 101, 104, 105], "exit": [9, 10], "save_video": 9, "video_fold": [9, 13], "episode_trigg": [9, 13], "step_trigg": [9, 13], "video_length": [9, 13], "name_prefix": [9, 13], "rl": [9, 13, 16, 19, 112], "episode_index": 9, "step_starting_index": 9, "extract": 9, "compos": 9, "record": [9, 11, 85], "store": [9, 10, 13], "iff": [9, 13, 17], "isn": 9, "entir": [9, 13, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 97, 105, 106], "snippet": [9, 13], "captur": [9, 13, 80], "Will": [9, 13], "prepend": [9, 13], "filenam": [9, 13], "moviepi": 9, "imagesequenceclip": 9, "durat": [9, 95, 97, 98, 99, 100, 101, 102, 103, 105], "step_index": 9, "199": 9, "capped_cubic_video_schedul": 9, "episode_id": 9, "27": [9, 89, 95, 98, 99], "729": 9, "1000": [9, 13, 16, 20, 69, 71, 86, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 112], "2000": [9, 85], "3000": 9, "schedul": [9, 110], "step_api_compat": [9, 18], "step_return": 9, "output_truncation_bool": [9, 13, 16], "is_vector_env": 9, "doc": [9, 13, 87], "ob": [9, 11, 14, 111], "interfac": [9, 106, 112], "conflict": [9, 106], "written": [9, 11, 106], "final": [9, 10, 13, 17, 19, 54], "desir": [9, 104, 105], "oldenv": 9, "vec_env": 9, "convert_to_terminated_truncated_step_api": [9, 18], "irrespect": 9, "convert_to_done_step_api": 9, "omit": [9, 94, 95, 96, 97, 98, 99, 104, 105], "env_check": [9, 16], "check_env": [9, 16], "skip_render_check": [9, 16], "invas": [9, 75], "farama": [9, 11, 17], "org": [9, 21, 106], "content": 9, "environment_cr": 9, "ignor": [9, 21, 108], "skip": [9, 13, 17, 21], "ci": 9, "parallel": [10, 20], "linear": [10, 20, 87, 89, 100, 101, 104], "speed": [10, 32, 85, 86, 106, 111], "taken": [10, 13, 17, 20, 45, 51, 88, 90, 111], "wait": [10, 19, 45, 47, 71], "until": [10, 11, 17, 44, 57, 102, 108], "overwritten": [10, 11], "final_observ": [10, 13, 20], "final_info": [10, 13], "asyncvectorenv": [10, 20], "syncvectorenv": [10, 20], "single_observation_spac": [10, 20], "single_action_spac": [10, 20], "v25": 10, "old": [10, 11, 13, 16, 18, 112], "vectorlistinfo": [10, 11, 13], "rememb": [10, 13, 17, 86], "share": 10, "other": [10, 11, 12, 13, 14, 17, 20, 27, 36, 39, 47, 53, 87, 93, 94, 96, 100, 102, 103, 105, 111], "word": [10, 102], "02240574": 10, "03439831": 10, "03904812": 10, "02810693": 10, "01586068": 10, "01929009": 10, "02394426": 10, "04016077": 10, "01314174": 10, "03893502": 10, "02400815": 10, "0038326": 10, "instead": [10, 14, 17, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 85, 89, 105], "00122802": [10, 20], "16228443": [10, 20], "02521779": [10, 20], "23700266": [10, 20], "00788269": [10, 20], "17490888": [10, 20], "03393489": [10, 20], "31735462": [10, 20], "04918966": [10, 20], "19421194": [10, 20], "02938497": [10, 20], "29495203": [10, 20], "releas": [10, 17, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 89, 91, 92, 93, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 108, 109, 110, 111], "resourc": [10, 17], "viewer": 10, "close_extra": 10, "synchron": 10, "asynchron": 10, "garbag": 10, "program": [10, 106], "04456399": 10, "04653909": 10, "01326909": 10, "02099827": 10, "03073904": 10, "00145001": 10, "03088818": 10, "03131252": 10, "03468829": 10, "01500225": 10, "01230312": 10, "01825218": 10, "registri": [10, 18], "env_fn": [10, 20], "context": [10, 20], "daemon": 10, "worker": [10, 20, 65], "pipe": 10, "commun": 10, "lambda": [10, 14, 15, 20], "81": [10, 20, 93], "62": [10, 20], "8286432": 10, "5597771": 10, "90249056": 10, "85009176": 10, "5266346": 10, "60007906": 10, "back": [10, 11, 20, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 49, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 95, 96], "improv": 10, "effici": [10, 14, 91, 92, 100, 106], "larg": [10, 11, 20, 92, 95, 96, 97, 98, 99, 102, 103, 104, 105, 106], "subprocess": 10, "flag": [10, 91, 106], "turn": [10, 13, 16, 24, 25, 86, 87, 100], "quit": [10, 17], "head": [10, 96], "spawn": [10, 20, 103], "children": 10, "overrid": [10, 11], "inner": 10, "logic": [10, 17, 86], "advanc": [10, 89, 106], "degre": [10, 14, 98, 99, 100], "flexibl": [10, 106], "chanc": 10, "shoot": [10, 28, 37, 39, 44, 45, 52, 53, 62, 65, 69, 74, 75, 83], "yourself": [10, 17, 20, 45, 65, 86], "foot": [10, 96, 97, 105], "thu": [10, 21, 47, 48, 49, 50, 51, 102, 103, 106], "own": [10, 20, 36, 71], "_worker": 10, "_worker_shared_memori": 10, "runtimeerror": [10, 20], "serial": 10, "modular": [11, 12, 14, 15, 16, 17, 106], "behavior": [11, 16, 17, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 93, 95, 96, 97, 98, 99, 104, 105, 106], "modif": [11, 16, 102, 103], "without": [11, 16, 17, 43, 98, 108, 110], "alter": [11, 16, 17, 21], "lot": [11, 16], "boilerpl": [11, 16, 17], "chain": [11, 16, 89, 104], "rescaleact": [11, 12, 16], "base_env": [11, 16], "wrapped_env": [11, 12, 13, 16, 17], "min_act": [11, 12, 16], "max_act": [11, 12, 16], "access": [11, 13, 20, 52, 106], "underneath": [11, 16, 90], "anoth": [11, 19, 20, 36, 98, 99, 101, 102, 103, 105, 111], "orderenforc": [11, 13, 17], "get": [11, 16, 19, 20, 21, 41, 44, 45, 46, 53, 63, 64, 65, 66, 68, 69, 70, 75, 85, 87, 95, 97, 98, 100, 108], "layer": [11, 16, 106], "bare": 11, "just": [11, 16, 47, 53, 70, 101, 103], "box2d": [11, 16, 85, 86, 87], "bipedal_walk": [11, 16, 85], "0x7f87d70712d0": [11, 16], "three": [11, 16, 17, 21, 24, 27, 29, 42, 50, 56, 63, 68, 69, 70, 71, 95, 97, 98, 99, 104, 105], "thing": [11, 14, 16, 20, 21], "do": [11, 13, 14, 15, 16, 17, 21, 34, 46, 67, 71, 72, 86, 87, 89, 95, 96, 97, 98, 104, 105, 106], "Such": [11, 16], "actionwrapp": [11, 12, 16], "observationwrapp": [11, 14, 16, 17], "rewardwrapp": [11, 15, 16], "present": [11, 17, 19, 89, 106], "section": [11, 16, 17, 20, 21, 72, 95, 96, 97, 98, 104, 105], "found": [11, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 94], "github": [11, 17, 94, 109], "com": [11, 17, 106, 109], "foundat": [11, 17], "forget": [11, 17], "commonli": [11, 16], "page": [11, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 85, 86, 87, 89, 90, 91, 92, 93, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 108, 109, 110, 111], "descript": [11, 17, 106], "ataripreprocess": [11, 13], "misc": 11, "tp": 11, "atari": [11, 18, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83], "clipact": [11, 12, 16], "clip": [11, 15, 16, 17, 91, 92, 95, 98], "envcompat": [11, 13], "compat": [11, 14, 20, 106, 112], "21": [11, 18, 95, 98, 99, 102, 108], "filterobserv": [11, 14], "filter": 11, "request": [11, 108], "framestack": [11, 13], "anobserv": 11, "stack": [11, 14, 20], "roll": [11, 14, 34, 102], "grayscaleobserv": [11, 14], "grai": [11, 13], "scale": [11, 13, 15, 21, 87, 95, 96, 97, 98, 104, 105, 106], "humanrend": [11, 13], "normalizeobserv": [11, 14], "center": [11, 14, 86, 87, 90, 93, 95, 96, 98, 99, 106, 109], "unit": [11, 14, 55, 89, 91, 92, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105], "varianc": [11, 14, 15], "normalizereward": [11, 15], "averag": [11, 15, 19, 98], "pixelobservationwrapp": [11, 14], "augment": [11, 14], "obtain": [11, 13, 16, 19, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 93, 108], "ad": [11, 13, 14, 17, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 49, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 87, 92, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 111], "replac": [11, 108], "recordepisodestatist": [11, 13], "recordvideo": [11, 13], "rollout": [11, 13, 111], "save": [11, 13], "rescal": [11, 16], "resizeobserv": [11, 14], "axbxc": [11, 14], "resiz": [11, 13], "timeawareobserv": [11, 14, 16], "trajectori": [11, 14, 15, 87, 98, 99], "append": [11, 14], "transformobserv": [11, 14], "transformreward": [11, 15], "th": [11, 20], "sometim": [11, 15, 16, 17, 20], "still": [11, 18, 21], "let": [11, 12, 15, 16, 17, 21, 36, 106], "penal": [11, 72], "energi": [11, 85, 87, 90, 106], "weight": [11, 19, 20, 95, 96, 97, 98, 102, 103, 104, 105, 106], "those": [11, 20, 23, 25, 26, 27, 28, 29, 32, 34, 36, 37, 41, 43, 44, 45, 46, 55, 58, 60, 61, 62, 64, 65, 67, 72, 74, 75, 77, 78, 79, 81, 82, 89, 94, 95, 96, 97, 98, 99, 100, 101, 105], "nevertheless": 11, "reacherrewardwrapp": 11, "reward_dist_weight": 11, "reward_ctrl_weight": 11, "reward_dist": [11, 102, 103], "reward_ctrl": [11, 102, 103], "suffici": [11, 27, 29, 31, 33, 38], "simpli": [12, 13, 14, 15, 17, 21, 109], "overwrit": [12, 14, 15], "domain": [12, 86, 89, 91, 92, 106, 111], "sai": [12, 13, 16], "discreteact": 12, "disc_to_cont": 12, "act": 12, "__name__": [12, 20], "__main__": [12, 20], "print": [12, 17], "among": [12, 14, 88, 94], "biped": [12, 84, 98, 99], "walker": [12, 84, 94, 103, 105], "affin": [12, 87], "75": [12, 95], "noop_max": 13, "frame_skip": [13, 95, 96, 97, 98, 104, 105], "screen_siz": 13, "84": [13, 95, 98, 99], "terminal_on_life_loss": 13, "grayscale_ob": 13, "grayscale_newaxi": 13, "scale_ob": 13, "2600": [13, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83], "guidelin": 13, "machado": [13, 21], "et": [13, 21], "al": [13, 18, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83], "2018": [13, 21, 89], "revisit": [13, 21], "arcad": [13, 21, 28, 45, 47, 48, 49, 50, 51, 106], "evalu": [13, 21, 106], "protocol": [13, 21], "open": [13, 16, 17, 21, 34, 94, 106], "problem": [13, 19, 21, 87, 90, 93, 100, 101, 104, 108, 111, 112], "stage": 13, "op": 13, "pool": [13, 104], "recent": [13, 14, 15, 18, 106], "life": [13, 27, 41, 45, 69, 73], "lost": [13, 30, 38, 57, 70, 74], "loss": [13, 108], "off": [13, 16, 38, 53, 61, 69, 86, 87, 111], "Not": 13, "squar": [13, 14, 17, 70, 102, 103, 111], "210x180": 13, "84x84": 13, "grayscal": [13, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83], "colour": [13, 86], "greyscal": 13, "255": [13, 14, 17, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 86], "No": [13, 89, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105], "frequenc": 13, "experi": [13, 95, 98, 99, 100, 101, 106], "whenev": [13, 17, 27, 30], "channel": 13, "axi": [13, 20, 91, 92, 96, 98, 99, 104], "dimension": [13, 16, 17, 25, 87, 95, 96, 97, 103, 104, 105, 106], "memori": [13, 14, 91, 92], "optim": [13, 21, 85, 87, 98, 99, 106], "benefit": 13, "opencv": 13, "caus": [13, 54], "new_ob": 13, "final_reward": 13, "final_termin": 13, "final_trunc": 13, "final_don": 13, "prior": [13, 106], "alongsid": [13, 16, 106], "previou": [13, 19, 95, 98, 99], "re": [13, 17, 20, 53, 68, 71], "old_env": 13, "legacyenv": 13, "retun": 13, "modern": [13, 106], "convers": [13, 106], "passiveenvcheck": 13, "cartpoleenv": 13, "customenv": [13, 16], "manual": [13, 16, 21, 47, 48, 49, 50, 51, 106], "unregist": [13, 20], "surround": [13, 106], "test": [13, 17, 85, 106], "haven": 13, "screen": [13, 21, 23, 27, 31, 36, 37, 39, 48, 54, 60, 70, 71, 95, 96, 97, 98, 99, 100, 101, 104, 105], "nativ": [13, 107], "nonativerend": 13, "disable_render_order_enforc": 13, "classic_control": [13, 88], "resetneed": 13, "deque_s": 13, "At": [13, 20, 30, 41, 44, 55], "_episod": 13, "elaps": 13, "sinc": [13, 16, 17, 18, 19, 20, 21, 47, 48, 49, 50, 51, 84, 90, 94, 103, 106, 111], "begin": [13, 17, 27, 30, 43, 68, 69, 70, 71], "num": [13, 21, 23, 25, 26, 27, 28, 29, 32, 34, 36, 37, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 55, 58, 60, 61, 62, 64, 65, 67, 72, 74, 75, 77, 78, 79, 81, 82, 89, 90, 91, 92, 93, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105], "buffer": [13, 14, 86, 106], "return_queu": 13, "length_queu": 13, "intermitt": 13, "hundredth": 13, "emploi": 13, "stop": [13, 19, 65, 75, 83, 106, 108], "span": 13, "strictli": 13, "pop_fram": 13, "reset_clean": 13, "clear": [13, 75], "issu": [13, 16, 17, 21, 95, 97, 98, 99, 105], "place": [13, 17, 25, 90, 91, 92], "part": [13, 19, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 85, 86, 87, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 108, 109, 110, 111], "\u01f9one": 13, "intend": [13, 106, 110], "around": [13, 31, 84, 103, 106], "outermost": 13, "actual": [13, 17, 111], "_k": 13, "classic": [13, 16, 19, 87, 89, 90, 91, 92, 93, 97, 101, 104, 105], "reflect": [14, 90], "2d": [14, 103, 106], "navig": [14, 16, 17, 30, 66], "agent_posit": 14, "target_posit": 14, "throw": [14, 16, 56], "awai": [14, 24, 64, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105], "freedom": [14, 98, 99, 100], "target": [14, 17, 19, 37, 89, 102, 103, 106], "rel": [14, 17, 89, 98, 99], "relativeposit": [14, 17], "ideal": 14, "subclass": 14, "accordingli": [14, 17, 71], "were": [14, 17, 38, 84, 89, 107], "incorrectli": [14, 19], "randn": [14, 20], "08319338": 14, "04635121": 14, "07394746": 14, "20877492": 14, "filter_kei": 14, "00067088": 14, "01860439": 14, "04772898": 14, "01911527": 14, "04560107": 14, "04466959": 14, "0328232": 14, "02367178": 14, "04649447": 14, "14996664": 14, "03329664": 14, "25847703": 14, "96": [14, 21, 86], "27648": 14, "num_stack": 14, "lz4_compress": 14, "lazyfram": 14, "fill": [14, 17, 30], "lz4": 14, "compress": 14, "keep_dim": 14, "uint8": [14, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83], "singleton": 14, "axbx1": 14, "axb": 14, "epsilon": [14, 15, 106], "1e": [14, 15, 98, 104, 105], "08": [14, 15], "past": [14, 15], "newli": [14, 15], "stabil": [14, 15, 98, 99], "pixels_onli": 14, "render_kwarg": 14, "pixel_kei": 14, "choos": [14, 17, 20], "odict_kei": 14, "400": [14, 111], "600": [14, 106], "discard": 14, "assertionerror": 14, "show": [14, 21, 31, 37, 108], "typeerror": 14, "unexpect": 14, "64": [14, 21], "03810719": 14, "03522411": 14, "02231044": 14, "01088205": 14, "03881167": 14, "16021058": 14, "0220928": 14, "28875574": 14, "becaus": [15, 16, 17, 20], "intrins": 15, "gain": [15, 31, 67, 73, 74, 77], "numer": [15, 99, 100, 101, 108], "clipreward": 15, "min_reward": 15, "max_reward": 15, "invari": 15, "incorrect": [15, 19], "gamma": [15, 19], "99": 15, "discount": [15, 19], "factor": 15, "veri": [16, 17, 87, 102, 106], "easi": [16, 57, 106, 107], "loop": [16, 20, 106], "torqu": [16, 85, 89, 93, 95, 96, 97, 98, 99, 102, 103, 104, 105], "motor": [16, 85, 104], "exchang": 16, "manipul": [16, 106], "robot": [16, 19, 33, 83, 85, 91, 92, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105], "succe": 16, "toward": [16, 29, 53, 104], "did": [16, 19], "yet": 16, "train": [16, 111], "maxim": 16, "accumul": [16, 43], "crash": [16, 87], "succeed": 16, "onward": [16, 19], "earlier": [16, 17], "someth": 16, "similarli": [16, 20, 87], "previous": [16, 21, 30], "core": [16, 106], "inher": [16, 19], "failur": [16, 19], "explain": 16, "retain": 16, "toggl": 16, "explicitli": [16, 17, 19], "saniti": 16, "util": [16, 17, 18, 20], "seem": 16, "mistak": 16, "best": [16, 21, 47, 48, 49, 50, 51, 106], "practic": [16, 19, 21, 47, 48, 49, 50, 51, 106], "reus": 16, "our": [16, 17, 106], "simpl": [16, 19, 85, 107, 109, 112], "6952509": 16, "4399011": 16, "7981693": 16, "li": [16, 106], "lie": 16, "markov": [16, 19], "aspect": [16, 19], "pong": [16, 18, 21, 36, 40], "k_left": 16, "k_right": 16, "constant": [16, 32, 71, 87, 92, 95, 97, 98, 105], "furthermor": 16, "gameplai": 16, "document": [17, 20, 21, 22, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 88, 95, 98, 99, 100, 107], "overview": 17, "relev": 17, "design": [17, 54, 89, 95, 98, 99, 107, 111], "clone": [17, 106], "virtual": [17, 106], "git": 17, "venv": 17, "bin": 17, "activ": [17, 70], "concern": 17, "readm": 17, "setup": 17, "gym_exampl": 17, "grid_world": 17, "relative_posit": 17, "reacher_weighted_reward": 17, "discrete_act": 17, "clip_reward": 17, "illustr": [17, 19], "simplist": 17, "gridworldenv": 17, "grid": [17, 25, 106, 111], "vertic": [17, 27, 85, 100, 101, 106], "horizont": [17, 27, 37, 85, 87, 89], "cell": [17, 106, 109], "locat": [17, 21, 57, 106, 111], "movement": [17, 99], "soon": [17, 111], "spars": [17, 89, 106], "blue": [17, 49, 51, 76, 89], "red": [17, 45, 51], "piec": 17, "abstract": 17, "shouldn": 17, "framer": [17, 21, 99, 102, 103], "window_s": 17, "512": 17, "encod": [17, 109, 111], "direct": [17, 69, 71, 89, 90, 91, 92, 95, 97, 98, 100, 101, 105, 106, 110], "walk": [17, 98, 105, 107, 110], "_action_to_direct": 17, "assert": 17, "clock": 17, "remain": [17, 19, 52, 55, 56, 71, 95, 109], "privat": [17, 40, 66], "_get_ob": 17, "translat": [17, 95, 98, 99], "mandatori": 17, "_agent_loc": 17, "_target_loc": 17, "manhattan": 17, "distanc": [17, 29, 46, 96], "_get_info": 17, "oftentim": 17, "determinist": [17, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 89, 91, 92, 109, 111], "worri": 17, "coincid": 17, "array_equ": 17, "_render_fram": 17, "trivial": 17, "gather": [17, 45, 66], "leav": [17, 30, 90, 94, 100], "els": [17, 97, 105, 110], "approach": [17, 100], "skeleton": 17, "init": [17, 86], "set_mod": 17, "canva": 17, "surfac": [17, 47, 71, 100, 101], "pix_square_s": 17, "rect": 17, "circl": [17, 26], "gridlin": 17, "width": 17, "visibl": 17, "blit": 17, "get_rect": 17, "pump": 17, "predefin": [17, 106], "delai": 17, "stabl": 17, "tick": 17, "surfarrai": 17, "pixels3d": 17, "bother": 17, "detect": 17, "put": 17, "registr": [17, 18], "300": [17, 34, 46, 85], "compon": 17, "appropri": [17, 20], "apart": [17, 45], "entrypoint": 17, "mere": 17, "extra": [17, 25, 30, 31, 33, 37, 39, 52, 71, 106], "third": 17, "parti": 17, "codebas": 17, "librari": [17, 106, 107, 112], "edit": 17, "configur": [17, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 88, 94, 106, 107], "setuptool": 17, "install_requir": 17, "local": 17, "perfectli": 17, "fine": 17, "variant": [17, 86], "instruct": [17, 94], "touch": [17, 33, 66], "top": [17, 21, 36, 41, 48, 54, 56, 70, 86, 87, 88, 91, 92, 97, 100, 101, 105], "big": [17, 26, 47], "advantag": [17, 95, 106], "job": [17, 29], "regist": [18, 20, 21], "sole": 18, "introduc": [18, 95, 98, 99], "v5": [18, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83], "increas": [18, 20, 43, 71, 87, 89, 90, 97, 104, 105], "backward": [18, 96], "eval": 18, "rst": 18, "definit": [19, 95, 97, 98], "success": [19, 44, 89, 111], "fall": [19, 41, 43, 63, 69, 85, 98, 110], "notabl": 19, "preserv": 19, "decis": [19, 106], "infinit": [19, 87, 97, 105, 108], "obviou": 19, "forev": 19, "forcibli": 19, "halt": 19, "idea": 19, "estim": [19, 95], "tell": 19, "abl": [19, 71], "formal": 19, "q_": 19, "o_t": 19, "a_t": 19, "r_t": 19, "max_a": 19, "o_": 19, "a_": 19, "q_target": 19, "deep": [19, 106], "distinct": 19, "becom": [19, 70, 84, 106], "frequent": 19, "differenti": 19, "shown": [19, 56, 86, 89], "vf_target": 19, "vf_next_stat": 19, "happen": [19, 70, 91, 92, 95, 97, 98, 99, 100, 101, 102, 103, 105], "suppli": [19, 37, 61], "sequenti": 20, "meant": 20, "basic": 20, "These": [20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 94, 95, 98, 104, 106, 107], "graviti": [20, 87, 90, 91, 93, 100, 101, 106], "exact": [20, 21, 34, 47, 48, 49, 50, 51, 108], "forkserv": 20, "standard": [20, 53, 95, 96, 100, 106], "02792548": 20, "04423395": 20, "00026012": 20, "04486719": 20, "04906582": 20, "02779809": 20, "02881928": 20, "04467649": 20, "0036706": 20, "00324916": 20, "047668": 20, "02039891": 20, "00187507": 20, "18986781": 20, "03168437": 20, "301252": 20, "02643229": 20, "18816885": 20, "04371385": 20, "3034975": 20, "02803041": 20, "24251814": 20, "02660446": 20, "29707024": 20, "regardless": [20, 95, 96, 97, 98, 104, 105], "arbitrarili": 20, "thereof": 20, "dictenv": 20, "fire": [20, 21, 23, 25, 26, 28, 29, 32, 34, 36, 37, 47, 48, 49, 50, 51, 54, 61, 62, 64, 65, 67, 68, 70, 71, 74, 75, 77, 79, 81, 82, 87], "jump": [20, 54, 69, 72], "acceler": [20, 86, 91, 92, 93], "5337036": 20, "7439302": 20, "41748118": 20, "9373266": 20, "5780453": 20, "8987405": 20, "917269": 20, "5888639": 20, "812942": 20, "23626241": 20, "0616814": 20, "4057572": 20, "4875375": 20, "26341468": 20, "72282314": 20, "3rd": 20, "fell": 20, "hole": [20, 63, 110], "is_slipperi": [20, 110], "prob": 20, "_prob": 20, "pair": [20, 98, 99], "_kei": 20, "logical_or": 20, "11350546": 20, "8090094": 20, "23710881": 20, "8017728": 20, "_final_observ": 20, "equal": [20, 91, 92, 100, 108, 110], "handi": 20, "thank": 20, "whole": 20, "scipi": 20, "special": [20, 24, 54], "softmax": [20, 106], "logit": 20, "argmax": [20, 111], "sent": 20, "expens": 20, "transfer": [20, 106], "cost": [20, 85, 96, 97, 104, 105, 106], "throughput": 20, "breakoutnoframeskip": 20, "timeit": 20, "23": [20, 95, 98, 99, 102, 106], "136": 20, "\u00b5": 20, "std": 20, "36": [20, 21, 36, 98, 99], "15": [20, 21, 44, 47, 48, 49, 50, 51, 55, 74, 87, 95, 96, 98, 99, 102, 105, 106, 110], "plan": [20, 106], "try": [20, 23, 24, 25, 34, 36, 41, 64, 65], "errorenv": 20, "shut": 20, "raw": 20, "smilesenv": 20, "whose": [20, 106, 108], "smile": 20, "notat": 20, "molecular": 20, "symbol": [20, 106], "__eq__": 20, "co": [20, 89, 91, 92, 93, 100, 103, 106], "_state": 20, "pickleabl": 20, "stella": 21, "adventur": [21, 40], "air": [21, 40], "raid": [21, 40], "alien": [21, 40, 42, 62, 75], "amidar": [21, 29, 40], "assault": [21, 40], "asterix": [21, 40], "asteroid": [21, 40], "atlanti": [21, 40], "licens": [21, 106], "download": [21, 106], "agre": 21, "todo": 21, "legal": [21, 47, 48, 49, 50, 51], "upright": [21, 27, 28, 32, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 55, 60, 90, 93, 100, 101], "upleft": [21, 27, 28, 32, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 55, 60], "downright": [21, 27, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 55, 58, 60], "downleft": [21, 27, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 55, 58, 60], "upfir": [21, 25, 28, 34, 47, 48, 49, 50, 51, 65, 77, 78, 79, 81, 82], "11": [21, 28, 47, 48, 49, 50, 51, 55, 58, 95, 96, 97, 98, 99, 100, 102, 103, 105, 108, 109], "rightfir": [21, 23, 25, 26, 28, 29, 32, 37, 47, 48, 49, 50, 51, 55, 58, 61, 62, 64, 74, 77, 78, 81, 82], "leftfir": [21, 23, 25, 26, 28, 29, 37, 47, 48, 49, 50, 51, 55, 58, 61, 62, 64, 74, 77, 78, 81, 82], "13": [21, 28, 47, 48, 49, 50, 51, 55, 58, 95, 96, 98, 99, 102, 105], "downfir": [21, 25, 28, 34, 47, 48, 49, 50, 51, 55, 58, 62, 65, 77, 79, 82], "uprightfir": [21, 28, 47, 48, 49, 50, 51, 55, 58], "upleftfir": [21, 28, 47, 48, 49, 50, 51, 55, 58], "16": [21, 30, 33, 36, 42, 47, 48, 49, 50, 51, 55, 93, 95, 96, 98, 99, 102, 105, 106, 110], "downrightfir": [21, 47, 48, 49, 50, 51, 55, 58], "17": [21, 33, 47, 48, 49, 50, 51, 55, 95, 96, 98, 99, 102, 105, 108], "downleftfir": [21, 47, 48, 49, 50, 51, 55, 58], "smaller": [21, 26, 28, 47, 48, 49, 50, 51], "enumer": [21, 47, 48, 49, 50, 51], "expand": [21, 47, 48, 49, 50, 51], "full": [21, 47, 48, 49, 50, 51, 86, 87], "full_action_spac": [21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83], "reduc": [21, 23, 25, 26, 27, 28, 29, 32, 34, 36, 37, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 55, 58, 60, 61, 62, 64, 65, 67, 72, 74, 75, 77, 78, 79, 81, 82, 90], "difficulti": [21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 106], "choic": 21, "player": [21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 108], "128": [21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83], "byte": [21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83], "ram": [21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83], "consol": [21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83], "atariag": [21, 22, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 76, 78, 79, 80, 81, 82, 83], "art": 21, "memor": 21, "sticki": [21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83], "small": [21, 51, 70, 85, 106, 107], "On": [21, 62, 89, 90, 91, 92, 93], "repeat": [21, 102], "frameskip": [21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83], "exclus": 21, "tabl": [21, 24, 25, 27, 41, 43, 98, 99, 102], "obs_typ": 21, "Its": 21, "repeat_action_prob": [21, 47, 48, 49, 50, 51], "stick": [21, 30, 52, 108], "ll": [21, 54, 71], "sound": [21, 106], "lock": 21, "emul": 21, "proper": 21, "audio": 21, "outlin": [21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 108], "variat": 21, "amidardeterminist": 21, "amidarnoframeskip": 21, "ramdeterminist": 21, "ramnoframeskip": 21, "suffix": [21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83], "noframeskip": [21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83], "airraid": [21, 23], "31": [21, 28, 98, 99], "bankheist": [21, 30], "20": [21, 30, 36, 63, 71, 87, 95, 98, 99, 102, 106, 111], "24": [21, 30, 36, 61, 85, 86, 87, 90, 95, 98, 99], "28": [21, 30, 36, 89, 98, 99], "battlezon": [21, 31], "beamrid": [21, 32], "berzerk": [21, 40], "18": [21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 95, 96, 98, 99, 102, 105], "bowl": [21, 40], "breakout": [21, 40], "32": [21, 36, 53, 98, 99, 108], "40": [21, 36, 61, 98, 99], "44": [21, 36, 98, 99], "carniv": [21, 40], "centiped": [21, 40], "22": [21, 38, 95, 98, 99, 102], "86": [21, 38], "choppercommand": [21, 39], "crazyclimb": [21, 41], "defend": [21, 29, 40, 45, 61, 73], "demonattack": [21, 43], "doubledunk": [21, 44], "elevatoract": [21, 45], "enduro": [21, 40], "fishingderbi": 21, "freewai": [21, 40], "frostbit": [21, 40], "gopher": [21, 40], "gravitar": [21, 40], "hero": [21, 40], "icehockei": 21, "jamesbond": [21, 40], "journeyescap": 21, "kangaroo": [21, 40], "krull": [21, 40], "kungfumast": [21, 58], "montezumareveng": [21, 59], "mspacman": [21, 60], "namethisgam": [21, 61], "phoenix": [21, 40], "pitfal": [21, 40, 85], "pooyan": [21, 40], "50": [21, 55, 65, 71, 87, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105], "70": [21, 65], "privateey": 21, "qbert": [21, 40], "riverraid": [21, 40], "roadrunn": [21, 69], "robotank": [21, 40, 70], "seaquest": [21, 40], "ski": [21, 40], "solari": [21, 40], "spaceinvad": 21, "stargunn": 21, "tenni": [21, 40], "timepilot": 21, "tutankham": [21, 40], "upndown": [21, 79], "ventur": [21, 40], "videopinbal": [21, 81, 82], "wizardofwor": [21, 82], "yarsreveng": 21, "zaxxon": [21, 40], "oppos": 21, "ai": 21, "mg": 21, "bellemar": 21, "naddaf": 21, "veness": 21, "platform": [21, 106], "journal": 21, "artifici": 21, "intellig": 21, "research": [21, 94, 100, 106], "2012": 21, "url": 21, "jair": 21, "php": 21, "articl": [21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83], "view": [21, 51, 106], "11182": 21, "250": [22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83], "160": [22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83], "enchant": [22, 38], "chalic": 22, "golden": 22, "castl": 22, "pick": [22, 45, 56, 69, 111], "sword": 22, "bridg": [22, 68, 106], "magnet": 22, "fight": [22, 35, 58, 61, 106], "outmanoeuvr": 22, "dragon": 22, "flavor": [22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83], "switch": [22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 106], "thorough": [22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83], "discuss": [22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83], "intric": [22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83], "stochast": [22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 88, 89, 91, 92, 94, 95, 96, 97, 98, 99, 100, 101, 103, 104, 105, 106, 111], "ship": [23, 24, 26, 32, 42, 51, 73], "sidewai": [23, 26, 32, 68, 72], "protect": [23, 29, 38, 39, 50, 55, 65], "fly": [23, 28, 52, 68, 87], "saucer": [23, 28, 75], "drop": [23, 30, 111], "bomb": [23, 42, 54, 62, 75], "meaning": [23, 25, 26, 27, 28, 29, 32, 34, 36, 37, 41, 43, 44, 45, 46, 55, 58, 60, 61, 62, 64, 65, 67, 72, 74, 75, 77, 78, 79, 81, 82], "210": [24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 38, 39, 42, 43, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83], "stuck": [24, 33, 52], "maze": [24, 25, 30, 33, 59, 78], "destroi": [24, 26, 28, 29, 30, 31, 32, 33, 36, 37, 38, 39, 42, 43, 51, 57, 68, 69, 70, 73, 74, 75, 77, 87], "egg": 24, "scatter": [24, 66], "simultan": [24, 25], "kill": [24, 33, 52, 57], "flamethrow": 24, "tricki": 24, "situat": [24, 111], "occasion": [24, 28], "power": [24, 52, 86, 87, 92, 100, 101, 106], "pulsar": 24, "temporari": 24, "abil": 24, "score": [24, 25, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 52, 53, 54, 55, 56, 57, 63, 64, 65, 66, 67, 68, 69, 71, 75, 76, 77, 81, 85, 87], "prize": [24, 79], "caught": [24, 30], "lose": [24, 27, 29, 38, 41, 42, 45, 52, 54, 63, 64, 66, 68, 69, 71, 72, 73, 87, 108], "consult": [24, 53, 54, 55, 56, 57], "pac": 25, "man": 25, "visit": [25, 45, 86], "enemi": [25, 26, 29, 31, 32, 33, 39, 42, 43, 45, 58, 67, 68, 70, 71, 73, 74, 75, 77, 83], "chicken": [25, 37, 48], "catch": [25, 41, 47, 69], "travers": 25, "vehicl": [26, 31, 46, 55, 106], "mother": [26, 56, 65], "overhead": [26, 87], "deploi": 26, "drone": 26, "dodg": [26, 32, 71], "attack": [26, 28, 29, 32, 40, 42, 65], "lyre": 27, "guid": [27, 48, 106], "award": [27, 33, 38, 41, 45, 71, 100, 101], "spaceship": [28, 42, 73], "field": [28, 106], "break": [28, 36, 86], "appear": [28, 30, 33, 70, 91, 92], "satellit": 28, "ufo": 28, "submerg": 29, "citi": [29, 30, 66, 106], "slowli": 29, "descend": 29, "strike": [29, 34], "defens": [29, 44], "post": 29, "manag": [29, 34], "seven": 29, "fought": 29, "wave": [29, 39, 43, 55, 62, 75], "outer": [29, 89], "robber": 30, "natur": [30, 108, 110], "rob": 30, "getawai": 30, "car": [30, 46, 84, 88, 106], "polic": 30, "chase": [30, 33], "dynamit": [30, 52], "ga": [30, 86], "tank": [30, 31, 71], "four": [30, 41, 86, 87, 95, 97, 105, 111], "nine": [30, 95], "person": [31, 89, 106], "perspect": [31, 106], "3d": [31, 95, 98, 99, 106], "illus": 31, "radar": [31, 82], "travel": 32, "steer": [32, 79, 86], "debri": 32, "leftifir": 32, "evil": [33, 58, 83], "wall": [33, 36, 52, 91, 92], "undefeat": 33, "otto": 33, "tri": 34, "knock": [34, 35], "pin": 34, "spar": 34, "spare": 34, "oppon": [35, 47, 53, 64, 79], "ring": 35, "hit": [35, 36, 37, 38, 43, 65, 66, 69, 70, 72, 108], "land": [35, 69, 87], "punch": [35, 56], "famou": 36, "paddl": [36, 64], "ball": [36, 53, 64, 81], "brick": 36, "wreak": 36, "havoc": 36, "five": [36, 66, 72, 88], "214": 37, "em": 37, "gun": [37, 45], "ammunit": 37, "steal": [37, 47], "bullet": [37, 106], "subtract": 37, "minu": 37, "sign": [37, 100, 101], "elf": 38, "magic": 38, "wand": 38, "fend": 38, "spider": 38, "flea": 38, "mushroom": 38, "forest": 38, "bitten": 38, "tempor": 38, "paralyz": 38, "scorpion": 38, "round": 38, "helicopt": [39, 41, 68], "truck": [39, 69], "convoi": 39, "aircraft": [39, 77], "mini": 39, "bottom": [39, 54, 86, 91, 92, 97, 105, 109], "plane": 39, "surviv": [39, 43], "bank": [40, 68], "heist": 40, "battl": 40, "zone": 40, "beam": [40, 52], "rider": 40, "chopper": 40, "command": [40, 94], "crazi": 40, "climber": 40, "demon": 40, "doubl": [40, 94], "dunk": 40, "elev": 40, "fish": 40, "derbi": 40, "ic": [40, 43, 49, 53], "hockei": [40, 53], "journei": [40, 55], "kung": 40, "fu": 40, "master": [40, 109], "montezuma": 40, "reveng": 40, "pacman": 40, "ey": [40, 61, 66, 106], "road": [40, 86], "runner": 40, "invad": [40, 74], "star": 40, "gunner": 40, "pilot": [40, 62, 83], "pinbal": 40, "wizard": [40, 58], "Of": 40, "wor": 40, "yar": 40, "builid": 41, "obstacl": [41, 55, 56], "damag": [41, 70], "climb": [41, 56, 88, 106], "fast": [41, 86, 94, 96, 98, 100, 104, 106], "least": [41, 76, 87], "row": [41, 74, 109, 110], "earth": [42, 74], "rescu": [42, 52, 56, 57, 58, 71, 73], "smart": 42, "shot": [42, 44, 45, 53, 54, 69, 106], "abduct": 42, "unlimit": 42, "laser": [42, 52, 74, 82], "missil": [42, 68], "aliv": [42, 98, 105], "face": [43, 95, 98, 99, 108], "planet": [43, 51, 73], "krybor": 43, "reserv": [43, 68, 70, 71], "bunker": [43, 51], "grant": [43, 87], "slai": 43, "2v2": 44, "basketbal": 44, "possess": 44, "rival": 44, "team": 44, "rule": [44, 76, 106, 108], "foul": 44, "secret": [45, 66], "ground": [45, 65, 85, 87, 95, 99, 106], "stair": 45, "equip": 45, "against": [45, 64, 76, 106], "floor": 45, "mark": 45, "door": [45, 106], "unreleas": 45, "prototyp": 45, "500": [45, 68, 89, 90, 111], "racer": 46, "nation": 46, "long": [46, 81, 90, 100, 101], "endur": 46, "race": [46, 69, 72, 84], "overtak": 46, "dai": [46, 84], "stai": 46, "meet": 46, "quota": 46, "sunfish": 47, "than": [47, 53, 71, 87, 89, 90, 91, 92, 96, 100, 101, 102, 104, 106, 108], "But": [47, 72], "fisherman": 47, "black": [47, 57, 89], "shark": [47, 61, 71], "lurk": [47, 67], "lane": [48, 106], "busi": 48, "rush": 48, "hour": 48, "traffic": 48, "cross": [48, 110], "bailei": 49, "who": [49, 50, 55, 56, 72], "hop": [49, 67, 97, 105], "forth": 49, "arctic": 49, "river": [49, 68], "block": [49, 106], "white": 49, "he": [49, 51], "hi": [49, 51, 66], "igloo": 49, "shovel": 50, "wield": 50, "farmer": 50, "crop": 50, "carrot": 50, "spacecraft": 51, "fiction": 51, "solar": 51, "system": [51, 89, 93, 100, 101, 106], "landscap": 51, "miner": 52, "mine": [52, 69], "shaft": 52, "tool": [52, 59], "propel": 52, "backpack": 52, "wherev": 52, "blast": [52, 71, 73], "vermin": 52, "raft": 52, "stretch": 52, "critter": 52, "minut": [53, 63], "period": [53, 97, 105], "puck": 53, "angl": [53, 54, 85, 87, 89, 90, 93, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105], "extrem": [53, 106, 107], "aim": [53, 97, 100, 104, 105], "rink": 53, "realli": 53, "mr": 54, "bond": 54, "multipurpos": 54, "craft": [54, 87], "varieti": [54, 106], "motion": [54, 106], "slightli": [54, 85, 95], "dive": 54, "lob": 54, "rate": [54, 71], "highest": [54, 106], "novic": 54, "006": 54, "007": 54, "lead": 55, "peski": 55, "backstag": 55, "scarab": 55, "000": [55, 68, 71], "concert": 55, "cash": 55, "grasp": 55, "groupi": 55, "photograph": 55, "promot": 55, "encount": [55, 56, 77, 106], "her": [56, 65], "preciou": 56, "babi": 56, "ladder": [56, 85], "bonu": [56, 70, 71, 75, 105], "fruit": 56, "monkei": 56, "corner": 56, "beast": 57, "fortress": [57, 59], "princess": [57, 58], "lyssa": 57, "sunris": 57, "monster": [57, 80], "templ": 58, "victoria": 58, "defeat": [58, 67], "acquir": [59, 94], "treasur": [59, 61, 63, 78, 80], "chamber": [59, 80], "emperor": 59, "deadli": 59, "creatur": [59, 67, 75, 106], "valuabl": 59, "pellet": 60, "ghost": 60, "discov": 61, "octopu": 61, "oxygen": [61, 71], "elimin": [62, 78, 79, 80], "war": 62, "bird": 62, "harri": 63, "jungl": 63, "die": [63, 65, 86], "misfortun": 63, "compet": 64, "deflect": 64, "pig": 65, "piglet": 65, "wolv": 65, "rope": 65, "balloon": 65, "guard": 65, "safe": [65, 87], "eat": [65, 69], "bait": 65, "wolf": 65, "stone": 65, "rock": [65, 69], "french": 66, "pierr": 66, "street": 66, "park": 66, "passag": 66, "dead": 66, "search": [66, 106], "ringlead": 66, "henri": 66, "le": 66, "fiend": 66, "gang": 66, "evid": 66, "stolen": 66, "good": 66, "statut": 66, "expir": 66, "nab": 66, "question": [66, 106], "auto": 66, "pothol": 66, "bert": 67, "cube": 67, "pyramid": 67, "destin": [67, 111], "nasti": 67, "jet": 68, "fli": 68, "fuel": [68, 73, 87], "depot": 68, "collid": [68, 71, 87], "squadron": [68, 70], "tanker": 68, "80": 68, "tm": 69, "outrun": 69, "wile": 69, "coyot": 69, "hazard": 69, "desert": 69, "rocket": [69, 70, 87], "cannon": [69, 74], "cliff": [69, 107], "steel": 69, "pile": 69, "birdse": 69, "cannonbal": 69, "scrambl": 70, "static": 70, "interfer": 70, "sensor": [70, 86], "report": [70, 85, 95, 98, 99], "flash": 70, "panel": 70, "earn": 70, "twelv": 70, "torpedo": 71, "diver": 71, "killer": 71, "deliv": [71, 111], "six": [71, 105], "explod": 71, "anyth": 71, "decreas": [71, 87], "almost": 71, "yoursub": 71, "blow": 71, "forc": [71, 73, 87, 90, 91, 92, 95, 98, 99, 100, 101], "less": [71, 85, 87, 100, 104], "worth": [71, 74], "90": 71, "moment": 71, "skier": 72, "gate": [72, 106], "fastest": 72, "miss": [72, 89, 111], "tree": 72, "slalom": 72, "penalti": 72, "warp": 73, "sector": 73, "feder": [73, 106], "zylon": 73, "refuel": 73, "cadet": 73, "corridor": 73, "mania": [75, 77], "orang": 76, "win": [76, 108], "margin": 76, "ti": 76, "sport": 76, "till": 76, "technologi": 77, "increasingli": 77, "futur": 77, "difficult": [77, 90, 94, 100, 101], "rack": 78, "tomb": 78, "guardian": 78, "baja": 79, "bugger": 79, "dungeon": 80, "beat": [82, 108], "scanner": 82, "armi": 83, "enslav": 83, "galaxi": 83, "fighter": 83, "lunar": 84, "lander": 84, "toi": [84, 106, 108, 109, 110, 111], "contribut": 84, "earli": [84, 106], "oleg": [84, 85, 86, 87], "klimov": [84, 85, 86, 87], "popular": [84, 106], "benchmark": [84, 106], "ever": 84, "joint": [85, 87, 89, 90, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105], "uneven": 85, "terrain": [85, 106], "hardcor": 85, "stump": 85, "1600": 85, "heurist": [85, 87], "demonstr": 85, "hip": [85, 95, 98, 99], "knee": [85, 98, 99], "hull": 85, "angular": [85, 87, 89, 90, 93, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105], "leg": [85, 87, 95, 97, 98, 99, 105, 106], "contact": [85, 87, 94, 95, 98, 99, 100], "lidar": [85, 106], "rangefind": 85, "measur": [85, 93, 95, 96, 97, 98, 99, 100, 102, 103, 104, 105, 106], "far": [85, 86, 100, 102, 103, 106], "better": 85, "stand": [85, 94, 95, 98, 99, 100, 101], "slight": 85, "exce": [85, 108], "closest": 85, "trace": 85, "furthest": 85, "faster": [85, 87, 99], "spent": [85, 87], "higher": 85, "friction": [85, 104, 106], "nervous": 85, "easiest": 86, "ab": [86, 106], "wheel": 86, "gyroscop": 86, "car_rac": 86, "rear": 86, "drive": [86, 111], "noth": [86, 87], "brake": 86, "96x96": 86, "tile": 86, "732": 86, "926": 86, "rest": [86, 87, 97, 105], "playfield": 86, "lap_complete_perc": 86, "dictat": [86, 87], "percentag": 86, "lap": 86, "domain_random": 86, "scenario": [86, 106], "background": 86, "demand": 86, "correspondingli": 86, "scheme": [86, 106], "chri": 86, "campbel": 86, "2014": 86, "www": 86, "iforce2d": 86, "net": [86, 108], "b2dtut": 86, "pontryagin": 87, "principl": 87, "engin": [87, 94], "throttl": 87, "why": 87, "pad": 87, "lunar_land": 87, "orient": [87, 95, 98, 99], "sum": [87, 95, 96, 97, 98, 99, 102, 103, 104, 105, 106, 108], "closer": [87, 108], "slower": 87, "tilt": 87, "03": 87, "solut": 87, "viewport": 87, "mass": [87, 95, 96, 98, 99, 104, 106], "bodi": [87, 94, 95, 96, 97, 98, 99, 100, 101, 104, 105], "moon": 87, "greater": [87, 89, 90, 91, 92, 96, 101, 102, 104, 108], "awak": 87, "group": 87, "come": [87, 95, 96, 97, 98, 99, 100, 101, 104, 105, 106], "sleep": 87, "littl": [87, 99], "cpu": 87, "wake": 87, "attach": [87, 90, 93, 95, 105], "enable_wind": 87, "wind_pow": 87, "turbulence_pow": 87, "later": 87, "booster": 87, "gravit": 87, "wind": 87, "tanh": 87, "sin": [87, 93, 100], "pi": [87, 89, 93], "9999": 87, "rotat": [87, 89, 95, 98, 99, 102], "turbul": 87, "renorm": 87, "harder": 87, "push": [87, 90, 100, 101, 106], "cart": [88, 100, 101], "mountain": 88, "nois": [88, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105], "regard": 88, "underpow": 88, "effort": 88, "easier": 88, "ones": [88, 94], "57": 89, "coars": 89, "barto": [89, 90, 100, 101, 108, 109], "book": [89, 108], "link": [89, 95, 96, 97, 98, 99, 103, 104], "linearli": [89, 100, 101], "actuat": [89, 90, 98, 99], "swing": [89, 93], "free": [89, 93, 94, 95, 98, 99, 100, 101, 106], "height": [89, 97, 100, 105], "hang": 89, "downward": 89, "seen": [89, 96, 106], "green": 89, "cosin": [89, 100, 103], "theta1": 89, "sine": [89, 100, 103], "theta2": 89, "567": 89, "274": 89, "4\u03c0": 89, "9\u03c0": 89, "rad": [89, 90, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105], "few": 89, "incur": [89, 109], "introduct": [89, 108, 109], "book_or_nip": 89, "neurip": [89, 106], "paper": [89, 100, 106], "nip": [89, 106], "equat": [89, 93], "confirm": 89, "experiment": [89, 106], "radian": [89, 90, 93, 101], "1996": 89, "touretzki": 89, "mozer": 89, "hasselmo": 89, "ed": [89, 111], "vol": 89, "mit": 89, "proceed": 89, "cc": 89, "1995": 89, "8f1d43620bc6bb580df6e80b0dc05c48": 89, "pdf": 89, "anderson": [90, 100, 101], "neuronlik": [90, 100, 101], "adapt": [90, 100, 101, 109], "That": 90, "un": 90, "frictionless": 90, "balanc": [90, 100, 101], "vari": [90, 100, 101, 106], "418": 90, "untermin": 90, "2095": 90, "allot": 90, "475": 90, "05": [90, 95, 96, 102], "07": [91, 92], "sinusoid": [91, 92], "vallei": [91, 92], "strateg": [91, 92], "hill": [91, 92], "andrew": [91, 92], "moor": [91, 92], "phd": [91, 92, 104], "thesi": [91, 92, 104], "1990": [91, 92], "techreport": [91, 92], "moore90efficientmemori": [91, 92], "author": [91, 92], "william": [91, 92], "institut": [91, 92], "univers": [91, 92], "cambridg": [91, 92], "year": [91, 92], "001": [91, 93, 97, 100, 105], "0025": [91, 92], "collis": [91, 92], "inelast": [91, 92], "upon": [91, 92], "quickli": [91, 106], "penalis": [91, 92, 95, 96, 97, 98, 99, 100, 102, 103, 104, 105], "0015": 92, "45": [92, 99, 102], "999": 92, "invert": [93, 94], "swingup": 93, "theori": [93, 100, 106], "diagram": 93, "meter": 93, "theta": 93, "tau": 93, "counter": 93, "clockwis": 93, "theta_dt": 93, "heta": 93, "2736044": 93, "calcul": [93, 94, 95, 98, 99, 100, 102, 103, 110], "simplifi": [93, 106], "math": 93, "half": 94, "cheetah": 94, "standup": 94, "facilit": [94, 106], "develop": 94, "biomechan": 94, "graphic": [94, 106], "anim": 94, "area": 94, "accur": [94, 106], "octob": 94, "2021": [94, 106], "deepmind": [94, 106], "2022": 94, "everyon": 94, "websit": [94, 106], "framework": 94, "ten": [94, 108], "iverteddoublependulum": 94, "gaussian": 94, "mjsim": 94, "qpo": 94, "qvel": [94, 98, 99], "indirectli": 94, "xml": [94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105], "tweak": [94, 104], "schulman": 95, "moritz": 95, "levin": 95, "jordan": 95, "abbeel": 95, "torso": [95, 96, 97, 98, 99, 105], "eight": 95, "hing": [95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105], "rotor": [95, 96, 97, 98, 99, 104, 105], "front": [95, 96, 104, 106], "hip_1": [95, 98, 99], "front_left_leg": [95, 98, 99], "angle_1": [95, 98, 99], "hip_2": [95, 98, 99], "front_right_leg": [95, 98, 99], "angle_2": 95, "hip_3": 95, "back_leg": 95, "angle_3": 95, "hip_4": 95, "right_back_leg": 95, "angle_4": 95, "deriv": [95, 96, 97, 98, 99, 100, 101, 104, 105], "exclude_current_positions_from_observ": [95, 96, 97, 98, 104, 105], "113": 95, "x_posit": [95, 96, 97, 98, 104, 105], "y_posit": [95, 98, 104], "111": 95, "centr": [95, 98, 99], "ankle_1": 95, "ankle_2": 95, "ankle_3": 95, "ankle_4": 95, "19": [95, 98, 99, 102], "dof": [95, 98, 99], "quaternion": [95, 98, 99], "healthy_reward": [95, 97, 98, 105], "healthi": [95, 97, 98, 105], "forward_reward": [95, 96, 97, 98, 104, 105], "dt": [95, 96, 97, 98, 102, 103, 104, 105], "frametim": [95, 96, 97, 98, 104, 105], "ctrl_cost": [95, 96, 97, 98, 104, 105], "too": [95, 96, 97, 98, 99, 100, 102, 103, 104, 105], "ctrl_cost_weight": [95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105], "ctr_cost_weight": 95, "contact_cost": [95, 98], "contact_cost_weight": [95, 98], "contact_force_rang": 95, "reset_noise_scal": [95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105], "deviat": [95, 96, 100, 104], "intention": [95, 98, 99], "therebi": [95, 98, 99], "said": [95, 97, 98, 105], "unhealthi": [95, 97, 98, 105], "healthy_z_rang": [95, 97, 98, 105], "terminate_when_unhealthi": [95, 97, 98, 105], "xml_file": [95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105], "path": [95, 96, 97, 98, 102, 103, 104, 105], "model": [95, 96, 97, 98, 104, 105, 106], "5e": [95, 97, 98, 105], "perturb": [95, 96, 97, 98, 104, 105], "exclud": [95, 96, 97, 98, 104, 105], "induct": [95, 96, 97, 98, 104, 105], "bia": [95, 96, 97, 98, 104, 105], "induc": [95, 96, 97, 98, 104, 105], "agnost": [95, 96, 97, 98, 99, 104, 105], "bind": [95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105], "camera": [95, 96, 97, 98, 99, 100, 101, 104, 105, 106], "mujoco_pi": [95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105], "max_time_step": [95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105], "wawrzy\u0144ski": 96, "cat": 96, "paw": 96, "alloc": 96, "thigh": [96, 97, 98, 99, 105], "shin": [96, 98, 99], "feet": [96, 105], "bthigh": 96, "bshin": 96, "bfoot": 96, "fthigh": 96, "fshin": 96, "ffoot": 96, "tip": [96, 100, 104], "rootz": [96, 97, 105], "slide": [96, 97, 100, 101, 102, 103, 104, 105], "rooti": [96, 97, 105], "rootx": [96, 97, 105], "forward_reward_weight": [96, 97, 98, 104, 105], "half_cheetah": 96, "erez": [97, 98, 99, 105], "tassa": [97, 98, 99, 105], "todorov": [97, 98, 99, 105], "predict": [97, 105], "nonlinear": [97, 105], "compar": [97, 104, 105], "figur": [97, 105], "middl": [97, 105], "thigh_joint": [97, 105], "leg_joint": [97, 105], "foot_joint": [97, 105], "002": [97, 105], "008": [97, 105], "healthy_state_rang": 97, "fallen": 97, "healthy_angle_rang": [97, 105], "376": [98, 99], "synthesi": [98, 99, 106], "onlin": [98, 99, 106], "abdomen": [98, 99], "arm": [98, 99, 102, 103, 106], "elbow": [98, 99, 102], "right_hip_x": [98, 99], "right_thigh": [98, 99], "right_hip_z": [98, 99], "right_hip_i": [98, 99], "right_kne": [98, 99], "left_hip_x": [98, 99], "left_thigh": [98, 99], "left_hip_z": [98, 99], "left_hip_i": [98, 99], "left_kne": [98, 99], "right_shoulder1": [98, 99], "right_shoulder2": [98, 99], "right_elbow": [98, 99], "left_shoulder1": [98, 99], "left_shoulder2": [98, 99], "left_elbow": [98, 99], "378": 98, "root": [98, 99], "lower_waist": [98, 99], "abdomen_z": [98, 99], "abdomen_i": [98, 99], "pelvi": [98, 99], "abdomen_x": [98, 99], "right_upper_arm": [98, 99], "right_lower_arm": [98, 99], "left_upper_arm": [98, 99], "left_lower_arm": [98, 99], "anglular": [98, 99, 101], "29": [98, 99], "aanglular": [98, 99], "33": [98, 99], "34": 98, "35": [98, 99], "37": [98, 99], "39": [98, 99], "41": [98, 99], "43": [98, 99], "velocitti": 98, "addition": [98, 99], "cinert": [98, 99], "inertia": [98, 99], "rigid": [98, 99], "intermedi": [98, 99], "nbodi": [98, 99], "henc": [98, 99, 107], "140": [98, 99], "cvel": [98, 99], "qfrc_actuat": [98, 99], "constraint": [98, 99, 100, 106], "nv": [98, 99], "cfrc_ext": [98, 99], "dim": [98, 99], "003": 98, "015": 98, "nu": [98, 99], "contact_cost_rang": 98, "lai": 99, "state_spac": 99, "uph_cost": 99, "upward": 99, "absolut": [99, 101, 105], "overal": 99, "atom": 99, "though": 99, "inflat": 99, "quad_ctrl_cost": 99, "quad_impact_cost": 99, "000001": 99, "105": 99, "unlik": [99, 100, 101, 102, 103], "beyond": [99, 100, 101, 102, 103, 105], "slider": [100, 101], "unitless": [100, 103], "hinge2": 100, "realist": [100, 106], "accuraci": [100, 106], "analyt": 100, "alive_bonu": 100, "distance_penalti": 100, "velocity_penalti": 100, "005": [100, 102, 103], "y_coordin": 100, "196": 100, "perpendicularli": 100, "cylind": 102, "effector": [102, 103], "fingertip": [102, 103], "shoulder": 102, "forearm": 102, "wrist": 102, "pan": 102, "r_shoulder_pan_joint": 102, "lift": 102, "r_shoulder_lift_joint": 102, "r_upper_arm_roll_joint": 102, "flex": 102, "r_elbow_flex_joint": 102, "r_forearm_roll_joint": 102, "r_wrist_flex_joint": 102, "r_wrist_roll_joint": 102, "analogi": 102, "tips_arm": 102, "obj_slidex": 102, "obj_slidei": 102, "goal_slidex": 102, "goal_slidei": 102, "sphere": 102, "reward_near": 102, "unattach": [102, 103], "reward_control": [102, 103], "euclidean": [102, 103], "perman": 102, "323": 102, "rise": 102, "asset": [102, 103], "gymnasmium": 102, "fixtur": 103, "joint0": 103, "joint1": 103, "target_x": 103, "target_i": 103, "position_fingertip": 103, "position_target": 103, "na": [103, 106], "disk": 103, "radiu": 103, "everyth": 103, "02": 103, "r\u00e9mi": 104, "coulom": 104, "applic": [104, 106], "segment": 104, "articul": [104, 106], "suspend": 104, "subject": [104, 106], "fluid": 104, "viscou": 104, "coeffici": 104, "motor1_rot": 104, "motor2_rot": 104, "\u03b8": 104, "free_body_rot": 104, "slider1": 104, "slider2": 104, "04": 104, "swim": 104, "split": 105, "thigh_left_joint": 105, "leg_left_joint": 105, "foot_left_joint": 105, "ctr_cost": 105, "doom": 106, "focus": 106, "visual": 106, "thousand": 106, "depth": 106, "annot": 106, "label": 106, "2016": 106, "cite": 106, "huge": 106, "3v3": 106, "hundr": 106, "roughli": 106, "tweakabl": 106, "monei": 106, "minecraft": 106, "challeng": 106, "procedur": 106, "generaliz": 106, "skill": 106, "slime": 106, "volleybal": 106, "motiv": 106, "maintain": [106, 112], "premad": 106, "imperfect": 106, "twisti": 106, "puzzl": 106, "weiqi": 106, "famous": 106, "conquer": 106, "alphago": 106, "synthes": 106, "neuro": 106, "architectur": 106, "integr": 106, "twin": 106, "concept": 106, "seamless": 106, "hardwar": 106, "world": [106, 111], "firmwar": 106, "neuroflight": 106, "extens": 106, "ro": 106, "thrust": 106, "ascend": 106, "shall": 106, "altitud": 106, "aerodynam": 106, "drag": 106, "light": 106, "poli": 106, "pinocchio": 106, "meshcat": 106, "web": 106, "minimalist": 106, "interior": 106, "room": 106, "hallwai": 106, "offic": 106, "home": 106, "dmlab": 106, "bitcraz": 106, "crazyfli": 106, "nanoquadrotor": 106, "mar": 106, "endeavor": 106, "gap": 106, "methodologi": 106, "coverag": 106, "commerci": 106, "mac": 106, "linux": 106, "laboratori": 106, "internet": 106, "ego": 106, "cloud": 106, "semant": 106, "project": 106, "cours": 106, "wide": 106, "account": 106, "yield": 106, "voltag": 106, "duti": 106, "cycl": 106, "emphasi": 106, "percept": 106, "social": 106, "driver": 106, "uncertain": 106, "propos": 106, "merg": 106, "intersect": 106, "roundabout": 106, "longitudin": 106, "comprehens": 106, "conduct": 106, "akin": 106, "anomali": 106, "inject": 106, "studi": 106, "robust": 106, "brax": 106, "compil": 106, "llvm": 106, "phase": 106, "gcc": 106, "cuda": 106, "hyperparamet": 106, "cheap": 106, "surrog": 106, "evolutionari": 106, "obsolet": 106, "windygrid": 106, "bandit": 106, "server": 106, "advertis": 106, "greedi": 106, "ucb1": 106, "trade": 106, "great": 106, "focu": 106, "simplic": 106, "autom": 106, "deduct": 106, "verif": 106, "minatar": 106, "metatrad": 106, "unus": 106, "techniqu": 106, "hard": 106, "strive": 106, "novel": 106, "transport": 106, "warehous": 106, "storag": 106, "overfit": 106, "mathemat": 106, "dataset": 106, "arxiv": 106, "2107": 106, "07373": 106, "baselin": 106, "expos": 106, "blockqnn": 106, "wise": 106, "nsc": 106, "cifar": 106, "meta": 106, "tag": 106, "answer": 106, "classif": 106, "omg": 106, "toolbox": 106, "electron": 106, "musculoskelet": 106, "opensim": 106, "physiolog": 106, "competit": 106, "2017": 106, "foss": 106, "interoper": 106, "quantum": 106, "circuit": 106, "wire": 106, "qubit": 106, "googl": 106, "quantumai": 106, "cirq": 106, "quadrotor": 106, "casadi": 106, "priori": 106, "taobao": 106, "largest": 106, "commerc": 106, "morl": 106, "equiti": 106, "market": 106, "acm": 106, "icaif21": 106, "public": 106, "financi": 106, "daili": 106, "investor": 106, "respons": 106, "theorem": 106, "prover": 106, "vampir": 106, "theoret": 106, "workshop": 106, "f1tenth": 106, "unoffici": 106, "baselines3": 106, "trackmania": 106, "2020": 106, "latent": 106, "imagin": 106, "miniatur": 106, "racecar": 106, "portabl": 106, "evolut": 106, "torc": 106, "wireless": 106, "elastica": 106, "assembli": 106, "slender": 106, "cosserat": 106, "rod": 106, "supertuxkart": 106, "accompani": 106, "ostrich": 106, "bio": 106, "mechan": 106, "locomot": 106, "soft": 106, "snake": 106, "propuls": 106, "music": 106, "dual": 106, "dexter": 106, "hand": 106, "isaac": 106, "omnivers": 106, "rust": 106, "jax": 106, "frozen": 107, "lake": 107, "suitabl": 107, "card": 108, "dealer": 108, "jack": 108, "queen": 108, "king": 108, "ac": 108, "usabl": 108, "deck": 108, "decid": [108, 110], "bust": 108, "reveal": 108, "facedown": 108, "goe": 108, "outcom": 108, "incompleteidea": 108, "2nd": 108, "html": 108, "sab": 108, "48": 109, "106": 109, "With": 109, "inspir": 109, "dennybritz": 109, "blob": 109, "cliff_walk": 109, "board": 109, "4x12": 109, "3x12": 109, "fact": 109, "slipperi": 110, "dir": 110, "current_row": 110, "nrow": 110, "current_col": 110, "col": 110, "4x4": 110, "desc": 110, "map_nam": 110, "sfff": 110, "fhfh": 110, "fffh": 110, "hffg": 110, "generate_random_map": 110, "toy_text": 110, "frozen_lak": 110, "preload": 110, "8x8": 110, "sfffffff": 110, "ffffffff": 110, "fffhffff": 110, "fffffhff": 110, "fhhfffhf": 110, "fhffhfhf": 110, "fffhfffg": 110, "perpendicular": 110, "bug": [110, 111], "maxq": 111, "decomposit": 111, "tom": 111, "dietterich": 111, "reen": 111, "ellow": 111, "lue": 111, "passeng": 111, "south": 111, "north": 111, "east": 111, "west": 111, "pickup": 111, "404": 111, "reachabl": 111, "taxi_row": 111, "taxi_col": 111, "passenger_loc": 111, "decod": 111, "action_mask": 111, "Or": 111, "q_valu": 111, "illeg": 111, "cleaner": 111, "disallow": 111, "loc": 111, "passidx": 111, "capabl": 112}, "objects": {"Space": [[4, 0, 1, "", "dtype"]], "": [[10, 1, 1, "", "action_space"], [10, 1, 1, "", "observation_space"], [10, 1, 1, "", "single_action_space"], [10, 1, 1, "", "single_observation_space"]], "gymnasium": [[12, 2, 1, "", "ActionWrapper"], [2, 2, 1, "", "Env"], [14, 2, 1, "", "ObservationWrapper"], [15, 2, 1, "", "RewardWrapper"], [11, 2, 1, "", "Wrapper"], [3, 3, 1, "", "make"], [3, 3, 1, "", "register"], [3, 3, 1, "", "spec"]], "gymnasium.ActionWrapper.ActionWrapper": [[12, 3, 1, "", "action"]], "gymnasium.Env": [[2, 1, 1, "", "action_space"], [2, 3, 1, "", "close"], [2, 1, 1, "", "metadata"], [2, 0, 1, "", "np_random"], [2, 1, 1, "", "observation_space"], [2, 3, 1, "", "render"], [2, 1, 1, "", "render_mode"], [2, 3, 1, "", "reset"], [2, 1, 1, "", "reward_range"], [2, 1, 1, "", "spec"], [2, 3, 1, "", "step"], [2, 0, 1, "", "unwrapped"]], "gymnasium.ObservationWrapper": [[14, 3, 1, "", "observation"]], "gymnasium.RewardWrapper.RewardWrapper": [[15, 3, 1, "", "reward"]], "gymnasium.Wrapper": [[11, 0, 1, "", "action_space"], [11, 3, 1, "", "close"], [11, 0, 1, "", "metadata"], [11, 0, 1, "", "np_random"], [11, 0, 1, "", "observation_space"], [11, 3, 1, "", "reset"], [11, 0, 1, "", "reward_range"], [11, 0, 1, "", "spec"], [11, 3, 1, "", "step"], [11, 0, 1, "", "unwrapped"]], "gymnasium.spaces": [[6, 2, 1, "", "Box"], [5, 2, 1, "", "Dict"], [6, 2, 1, "", "Discrete"], [5, 2, 1, "", "Graph"], [6, 2, 1, "", "MultiBinary"], [6, 2, 1, "", "MultiDiscrete"], [5, 2, 1, "", "Sequence"], [4, 2, 1, "", "Space"], [6, 2, 1, "", "Text"], [5, 2, 1, "", "Tuple"]], "gymnasium.spaces.Box": [[6, 4, 1, "", "is_bounded"], [6, 4, 1, "", "sample"], [6, 4, 1, "", "seed"]], "gymnasium.spaces.Dict": [[5, 4, 1, "", "sample"], [5, 4, 1, "", "seed"]], "gymnasium.spaces.Discrete": [[6, 4, 1, "", "sample"], [6, 4, 1, "", "seed"]], "gymnasium.spaces.Graph": [[5, 4, 1, "", "sample"], [5, 4, 1, "", "seed"]], "gymnasium.spaces.MultiBinary": [[6, 4, 1, "", "sample"], [6, 4, 1, "", "seed"]], "gymnasium.spaces.MultiDiscrete": [[6, 4, 1, "", "sample"], [6, 4, 1, "", "seed"]], "gymnasium.spaces.Sequence": [[5, 4, 1, "", "sample"], [5, 4, 1, "", "seed"]], "gymnasium.spaces.Text": [[6, 4, 1, "", "sample"], [6, 4, 1, "", "seed"]], "gymnasium.spaces.Tuple": [[5, 4, 1, "", "sample"], [5, 4, 1, "", "seed"]], "gymnasium.spaces.space.Space": [[4, 3, 1, "", "contains"], [4, 3, 1, "", "from_jsonable"], [4, 3, 1, "", "sample"], [4, 3, 1, "", "seed"], [4, 0, 1, "", "shape"], [4, 3, 1, "", "to_jsonable"]], "gymnasium.spaces.utils": [[7, 3, 1, "", "flatdim"], [7, 3, 1, "", "flatten"], [7, 3, 1, "", "flatten_space"], [7, 3, 1, "", "unflatten"]], "gymnasium.utils.env_checker": [[9, 3, 1, "", "check_env"]], "gymnasium.utils.play": [[9, 2, 1, "", "PlayPlot"], [9, 2, 1, "", "PlayableGame"], [9, 3, 1, "", "play"]], "gymnasium.utils.play.PlayPlot": [[9, 4, 1, "", "callback"]], "gymnasium.utils.play.PlayableGame": [[9, 4, 1, "", "process_event"]], "gymnasium.utils.save_video": [[9, 3, 1, "", "capped_cubic_video_schedule"], [9, 3, 1, "", "save_video"]], "gymnasium.utils.seeding": [[9, 3, 1, "", "np_random"]], "gymnasium.utils.step_api_compatibility": [[9, 3, 1, "", "convert_to_done_step_api"], [9, 3, 1, "", "convert_to_terminated_truncated_step_api"], [9, 3, 1, "", "step_api_compatibility"]], "gymnasium.vector": [[10, 2, 1, "", "AsyncVectorEnv"], [10, 2, 1, "", "SyncVectorEnv"], [10, 2, 1, "", "VectorEnv"], [10, 3, 1, "", "make"]], "gymnasium.vector.VectorEnv": [[10, 4, 1, "", "close"], [10, 4, 1, "", "reset"], [10, 4, 1, "", "step"]], "gymnasium.vector.utils": [[8, 3, 1, "", "batch_space"], [8, 3, 1, "", "concatenate"], [8, 3, 1, "", "create_empty_array"], [8, 3, 1, "", "create_shared_memory"], [8, 3, 1, "", "iterate"], [8, 3, 1, "", "read_from_shared_memory"], [8, 3, 1, "", "write_to_shared_memory"]], "gymnasium.wrappers": [[13, 2, 1, "", "AtariPreprocessing"], [13, 2, 1, "", "AutoResetWrapper"], [12, 2, 1, "", "ClipAction"], [13, 2, 1, "", "EnvCompatibility"], [14, 2, 1, "", "FilterObservation"], [14, 2, 1, "", "FlattenObservation"], [14, 2, 1, "", "FrameStack"], [14, 2, 1, "", "GrayScaleObservation"], [13, 2, 1, "", "HumanRendering"], [14, 2, 1, "", "NormalizeObservation"], [15, 2, 1, "", "NormalizeReward"], [13, 2, 1, "", "OrderEnforcing"], [13, 2, 1, "", "PassiveEnvChecker"], [14, 2, 1, "", "PixelObservationWrapper"], [13, 2, 1, "", "RecordEpisodeStatistics"], [13, 2, 1, "", "RecordVideo"], [13, 2, 1, "", "RenderCollection"], [12, 2, 1, "", "RescaleAction"], [14, 2, 1, "", "ResizeObservation"], [13, 2, 1, "", "StepAPICompatibility"], [14, 2, 1, "", "TimeAwareObservation"], [13, 2, 1, "", "TimeLimit"], [14, 2, 1, "", "TransformObservation"], [15, 2, 1, "", "TransformReward"], [13, 2, 1, "", "VectorListInfo"]]}, "objtypes": {"0": "py:property", "1": "py:attribute", "2": "py:class", "3": "py:function", "4": "py:method"}, "objnames": {"0": ["py", "property", "Python property"], "1": ["py", "attribute", "Python attribute"], "2": ["py", "class", "Python class"], "3": ["py", "function", "Python function"], "4": ["py", "method", "Python method"]}, "titleterms": {"404": 0, "page": [0, 1], "Not": 0, "found": 0, "The": [0, 106], "request": 0, "could": 0, "gymnasium": [1, 2, 10, 11, 17, 112], "doc": 1, "instruct": 1, "modifi": 1, "environ": [1, 2, 3, 9, 10, 13, 16, 17, 18, 20, 106, 112], "edit": 1, "an": [1, 16], "ad": 1, "new": [1, 9], "atari": [1, 13, 21, 40], "env": [1, 2, 10, 16, 17, 106], "non": 1, "other": [1, 106], "step": [1, 9, 16, 17, 18], "build": 1, "document": 1, "method": [2, 4, 10, 11], "attribut": [2, 4, 10, 11], "addit": 2, "implement": [2, 11], "registri": 3, "make": [3, 10, 17], "regist": [3, 17], "all": 3, "spec": 3, "space": [4, 5, 6, 7, 8, 16, 20, 21, 47, 48, 49, 50, 51, 85, 86, 87, 89, 90, 91, 92, 93, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 108, 110], "fundament": [4, 6], "composit": [4, 5], "util": [4, 7, 8, 9], "vector": [4, 8, 10, 13, 20], "dict": 5, "tupl": 5, "sequenc": 5, "graph": 5, "box": [6, 35], "discret": 6, "multibinari": 6, "multidiscret": 6, "text": [6, 107], "share": [8, 20], "memori": [8, 20], "visual": 9, "save": 9, "render": [9, 13, 17], "video": [9, 13, 81, 106], "old": 9, "api": [9, 16, 18, 112], "compat": [9, 13, 16, 18], "seed": 9, "check": [9, 16], "vectorenv": 10, "async": 10, "sync": 10, "wrapper": [11, 12, 13, 14, 15, 16, 17], "custom": [11, 17, 20], "action": [12, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 85, 86, 87, 89, 90, 91, 92, 93, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 108, 109, 110, 111], "clip": 12, "rescal": 12, "misc": 13, "preprocess": 13, "autoreset": 13, "passiv": 13, "checker": 13, "human": 13, "order": 13, "enforc": 13, "record": 13, "episod": [13, 85, 86, 87, 89, 90, 91, 92, 93, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105], "statist": 13, "collect": [13, 112], "time": [13, 14, 19], "limit": [13, 19], "list": [13, 40], "info": [13, 111], "observ": [14, 17, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 85, 86, 87, 89, 90, 91, 92, 93, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 108, 109, 110, 111], "transform": [14, 15], "filter": 14, "flatten": 14, "framestack": 14, "grai": 14, "scale": 14, "normal": [14, 15], "pixel": 14, "resiz": 14, "awar": 14, "reward": [15, 21, 24, 25, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 85, 86, 87, 89, 90, 91, 92, 93, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 108, 109, 110, 111], "basic": 16, "usag": [16, 20], "initi": [16, 17], "interact": 16, "chang": 16, "backward": 16, "conform": 16, "plai": 16, "within": 16, "your": [17, 20], "own": 17, "subclass": 17, "declar": 17, "construct": 17, "from": 17, "state": [17, 85, 86, 87, 89, 90, 91, 92, 93, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105], "reset": [17, 86], "close": 17, "creat": [17, 20], "packag": 17, "instanc": 17, "us": 17, "gym": [18, 106], "load": 18, "openai": [18, 106], "v0": 18, "22": 18, "handl": [19, 20], "termin": [19, 85, 86, 87], "truncat": [19, 93], "import": 19, "learn": [19, 106, 112], "code": 19, "solut": 19, "work": 20, "intermedi": 20, "except": 20, "advanc": 20, "autorom": 21, "instal": 21, "rom": 21, "stochast": 21, "common": 21, "argument": [21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 85, 86, 87, 89, 90, 91, 92, 93, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 108, 109, 110, 111], "version": [21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 85, 86, 87, 89, 91, 92, 93, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 108, 109, 110, 111], "histori": [21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 85, 86, 87, 89, 91, 92, 93, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 108, 109, 110, 111], "name": [21, 61], "scheme": 21, "flavor": 21, "refer": [21, 86, 89, 112], "adventur": 22, "descript": [22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 85, 86, 87, 89, 90, 91, 92, 93, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 108, 109, 111], "air": 23, "raid": 23, "alien": 24, "amidar": 25, "assault": 26, "asterix": 27, "asteroid": 28, "atlanti": 29, "bank": 30, "heist": 30, "battl": 31, "zone": 31, "beam": 32, "rider": 32, "berzerk": 33, "bowl": 34, "breakout": 36, "carniv": 37, "centiped": 38, "chopper": 39, "command": 39, "complet": 40, "crazi": 41, "climber": 41, "defend": 42, "demon": 43, "attack": 43, "doubl": [44, 100], "dunk": 44, "elev": 45, "enduro": 46, "fishingderbi": 47, "freewai": 48, "frostbit": 49, "gopher": 50, "gravitar": 51, "hero": 52, "icehockei": 53, "jamesbond": 54, "journeyescap": 55, "kangaroo": 56, "krull": 57, "kung": 58, "fu": 58, "master": 58, "montezuma": 59, "reveng": 59, "m": 60, "pacman": 60, "thi": 61, "game": [61, 106], "phoenix": 62, "pitfal": 63, "pong": 64, "pooyan": 65, "privateey": 66, "qbert": 67, "riverraid": 68, "road": 69, "runner": 69, "robot": [70, 106], "tank": 70, "seaquest": 71, "ski": 72, "solari": 73, "spaceinvad": 74, "stargunn": 75, "tenni": 76, "timepilot": 77, "tutankham": 78, "up": 79, "n": 79, "down": 79, "ventur": 80, "pinbal": 81, "wizard": 82, "wor": 82, "zaxxon": 83, "box2d": 84, "biped": 85, "walker": 85, "start": [85, 86, 87, 89, 90, 91, 92, 93, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105], "credit": [85, 86, 87], "car": [86, 91, 92], "race": [86, 106], "lunar": 87, "lander": 87, "classic": [88, 106], "control": [88, 106], "acrobot": 89, "end": [89, 90, 91, 92, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105], "cart": 90, "pole": 90, "mountain": [91, 92], "transit": [91, 92], "dynam": [91, 92], "continu": 92, "pendulum": [93, 100, 101], "mujoco": 94, "ant": 95, "half": 96, "cheetah": 96, "hopper": 97, "humanoid": [98, 99], "standup": 99, "invert": [100, 101], "pusher": 102, "reacher": 103, "swimmer": 104, "note": 104, "walker2d": 105, "third": 106, "parti": 106, "vizdoom": 106, "flappi": 106, "bird": 106, "A": 106, "derk": 106, "gpu": 106, "acceler": 106, "moba": 106, "minerl": 106, "procgen": 106, "slimevolleygym": 106, "simpl": 106, "singl": 106, "multi": 106, "agent": 106, "reinforc": [106, 112], "stabl": 106, "retro": 106, "uniti": 106, "ml": 106, "board": 106, "card": 106, "etc": 106, "abalon": 106, "two": 106, "player": 106, "abstract": 106, "strategi": 106, "spoof": 106, "xiangqi": 106, "chines": 106, "chess": 106, "rubikscubegym": 106, "gymgo": 106, "gymfc": 106, "flight": 106, "tune": 106, "train": 106, "framework": 106, "gazebo": 106, "goddard": 106, "": 106, "rocket": 106, "problem": 106, "jimini": 106, "miniworld": 106, "pybullet": 106, "drone": 106, "marsexplor": 106, "panda": 106, "robo": 106, "offworld": 106, "autonom": 106, "drive": 106, "traffic": 106, "carla": 106, "duckietown": 106, "electr": 106, "motor": 106, "highwai": 106, "longicontrol": 106, "sumo": 106, "rl": 106, "commonroad": 106, "pettingzoo": 106, "anomalous_rl_env": 106, "carl": 106, "compilergym": 106, "dacbench": 106, "gridworld": 106, "adserv": 106, "algorithm": 106, "anytrad": 106, "autokei": 106, "ccc": 106, "cellular": 106, "automata": 106, "inventori": 106, "maze": 106, "mtsim": 106, "legaci": 106, "toytext": 106, "riverswim": 106, "recsi": 106, "sokoban": 106, "math": 106, "prog": 106, "synth": 106, "nasgym": 106, "nlpgym": 106, "toolkit": 106, "develop": 106, "solv": 106, "nlp": 106, "task": 106, "obstacl": 106, "tower": 106, "openmodelica": 106, "microgrid": 106, "osim": 106, "pge": 106, "parallel": 106, "engin": 106, "qasgym": 106, "safe": 106, "virtualtaobao": 106, "mo": 106, "abid": 106, "satur": 106, "shinrl": 106, "go": 106, "explor": 106, "tmrl": 106, "racing_dream": 106, "racecar_gym": 106, "evogym": 106, "design": 106, "tool": 106, "l2r": 106, "gym_torc": 106, "mobil": 106, "softrobot": 106, "pyelastica": 106, "tuxkart": 106, "ai": 106, "ostrichrl": 106, "quadrup": 106, "pogo": 106, "stick": 106, "jump": 106, "igibson": 106, "snakerl": 106, "starship": 106, "land": 106, "raveforc": 106, "line": 106, "follow": 106, "dexteroushand": 106, "omniisaacgymenv": 106, "border": 106, "spacerobotenv": 106, "gymnax": 106, "toi": 107, "blackjack": 108, "cliff": 109, "walk": 109, "frozen": 110, "lake": 110, "taxi": 111, "i": 112, "standard": 112, "divers": 112}, "envversion": {"sphinx.domains.c": 2, "sphinx.domains.changeset": 1, "sphinx.domains.citation": 1, "sphinx.domains.cpp": 8, "sphinx.domains.index": 1, "sphinx.domains.javascript": 2, "sphinx.domains.math": 2, "sphinx.domains.python": 3, "sphinx.domains.rst": 2, "sphinx.domains.std": 2, "sphinx": 57}, "alltitles": {"404 - Page Not Found": [[0, "page-not-found"]], "The requested page could not be found.": [[0, "the-requested-page-could-not-be-found"]], "Gymnasium-docs": [[1, "gymnasium-docs"]], "Instructions for modifying environment pages": [[1, "instructions-for-modifying-environment-pages"]], "Editing an environment page": [[1, "editing-an-environment-page"]], "Adding a new environment": [[1, "adding-a-new-environment"]], "Atari env": [[1, "atari-env"]], "Non-Atari env": [[1, "non-atari-env"]], "Other steps": [[1, "other-steps"]], "Build the Documentation": [[1, "build-the-documentation"]], "Env": [[2, "env"]], "gymnasium.Env": [[2, "gymnasium-env"]], "Methods": [[2, "methods"], [4, "methods"], [10, "methods"], [11, "methods"]], "Attributes": [[2, "attributes"], [4, "attributes"], [10, "attributes"], [11, "attributes"]], "Additional Methods": [[2, "additional-methods"]], "Implementing environments": [[2, "implementing-environments"]], "Registry": [[3, "registry"]], "Make": [[3, "make"]], "Register": [[3, "register"]], "All registered environments": [[3, "all-registered-environments"]], "Spec": [[3, "spec"]], "Spaces": [[4, "spaces"], [16, "spaces"]], "Fundamental Spaces": [[4, "fundamental-spaces"], [6, "fundamental-spaces"]], "Composite Spaces": [[4, "composite-spaces"], [5, "composite-spaces"]], "Utils": [[4, "utils"], [9, "utils"]], "Vector Utils": [[4, "vector-utils"]], "Dict": [[5, "dict"]], "Tuple": [[5, "tuple"]], "Sequence": [[5, "sequence"]], "Graph": [[5, "graph"]], "Box": [[6, "box"]], "Discrete": [[6, "discrete"]], "MultiBinary": [[6, "multibinary"]], "MultiDiscrete": [[6, "multidiscrete"]], "Text": [[6, "text"]], "Spaces Utils": [[7, "spaces-utils"]], "Spaces Vector Utils": [[8, "spaces-vector-utils"]], "Shared Memory Utils": [[8, "shared-memory-utils"]], "Visualization": [[9, "visualization"]], "Save Rendering Videos": [[9, "save-rendering-videos"]], "Old to New Step API Compatibility": [[9, "old-to-new-step-api-compatibility"]], "Seeding": [[9, "seeding"]], "Environment Checking": [[9, "environment-checking"]], "Vector": [[10, "vector"]], "Gymnasium.vector.VectorEnv": [[10, "gymnasium-vector-vectorenv"]], "Making Vector Environments": [[10, "making-vector-environments"]], "Async Vector Env": [[10, "async-vector-env"]], "Sync Vector Env": [[10, "sync-vector-env"]], "Wrappers": [[11, "wrappers"], [16, "wrappers"]], "gymnasium.Wrapper": [[11, "gymnasium-wrapper"]], "Gymnasium Wrappers": [[11, "gymnasium-wrappers"]], "Implementing a custom wrapper": [[11, "implementing-a-custom-wrapper"]], "Action Wrappers": [[12, "action-wrappers"]], "Action Wrapper": [[12, "action-wrapper"]], "Clip Action": [[12, "clip-action"]], "Rescale Action": [[12, "rescale-action"]], "Misc Wrappers": [[13, "misc-wrappers"]], "Atari Preprocessing": [[13, "atari-preprocessing"]], "Autoreset": [[13, "autoreset"]], "Compatibility": [[13, "compatibility"]], "Passive Environment Checker": [[13, "passive-environment-checker"]], "Human Rendering": [[13, "human-rendering"]], "Order Enforcing": [[13, "order-enforcing"]], "Record Episode Statistics": [[13, "record-episode-statistics"]], "Record Video": [[13, "record-video"]], "Render Collection": [[13, "render-collection"]], "Time Limit": [[13, "time-limit"]], "Vector List Info": [[13, "vector-list-info"]], "Observation Wrappers": [[14, "observation-wrappers"]], "Observation Wrapper": [[14, "observation-wrapper"]], "Transform Observation": [[14, "transform-observation"]], "Filter Observation": [[14, "filter-observation"]], "Flatten Observation": [[14, "flatten-observation"]], "Framestack Observations": [[14, "framestack-observations"]], "Gray Scale Observation": [[14, "gray-scale-observation"]], "Normalize Observation": [[14, "normalize-observation"]], "Pixel Observation Wrapper": [[14, "pixel-observation-wrapper"]], "Resize Observation": [[14, "resize-observation"]], "Time Aware Observation": [[14, "time-aware-observation"]], "Reward Wrappers": [[15, "reward-wrappers"]], "Reward Wrapper": [[15, "reward-wrapper"]], "Transform Reward": [[15, "transform-reward"]], "Normalize Reward": [[15, "normalize-reward"]], "Basic Usage": [[16, "basic-usage"]], "Initializing Environments": [[16, "initializing-environments"]], "Interacting with the Environment": [[16, "interacting-with-the-environment"]], "Change in env.step API": [[16, "change-in-env-step-api"]], "Backward compatibility": [[16, "backward-compatibility"]], "Checking API-Conformity": [[16, "checking-api-conformity"]], "Playing within an environment": [[16, "playing-within-an-environment"]], "Make your own custom environment": [[17, "make-your-own-custom-environment"]], "Subclassing gymnasium.Env": [[17, "subclassing-gymnasium-env"]], "Declaration and Initialization": [[17, "declaration-and-initialization"]], "Constructing Observations From Environment States": [[17, "constructing-observations-from-environment-states"]], "Reset": [[17, "reset"]], "Step": [[17, "step"]], "Rendering": [[17, "rendering"]], "Close": [[17, "close"]], "Registering Envs": [[17, "registering-envs"]], "Creating a Package": [[17, "creating-a-package"]], "Creating Environment Instances": [[17, "creating-environment-instances"]], "Using Wrappers": [[17, "using-wrappers"]], "Compatibility with Gym": [[18, "compatibility-with-gym"]], "Loading OpenAI Gym environments": [[18, "loading-openai-gym-environments"]], "< v0.22 Environment Compatibility": [[18, "v0-22-environment-compatibility"]], "Step API Compatibility": [[18, "step-api-compatibility"]], "Handling Time Limits": [[19, "handling-time-limits"]], "Termination": [[19, "termination"]], "Truncation": [[19, "truncation"]], "Importance in learning code": [[19, "importance-in-learning-code"]], "Solution": [[19, "solution"]], "Vectorizing your environments": [[20, "vectorizing-your-environments"]], "Vectorized Environments": [[20, "vectorized-environments"]], "Creating a vectorized environment": [[20, "creating-a-vectorized-environment"]], "Working with vectorized environments": [[20, "working-with-vectorized-environments"]], "Observation & Action spaces": [[20, "observation-action-spaces"]], "Intermediate Usage": [[20, "intermediate-usage"]], "Shared memory": [[20, "shared-memory"]], "Exception handling": [[20, "exception-handling"]], "Advanced Usage": [[20, "advanced-usage"]], "Custom spaces": [[20, "custom-spaces"]], "Atari": [[21, "atari"]], "AutoROM (installing the ROMs)": [[21, "autorom-installing-the-roms"]], "Action Space": [[21, "action-space"], [47, "action-space"], [48, "action-space"], [49, "action-space"], [50, "action-space"], [51, "action-space"], [85, "action-space"], [86, "action-space"], [87, "action-space"], [89, "action-space"], [90, "action-space"], [91, "action-space"], [92, "action-space"], [93, "action-space"], [95, "action-space"], [96, "action-space"], [97, "action-space"], [98, "action-space"], [99, "action-space"], [100, "action-space"], [101, "action-space"], [102, "action-space"], [103, "action-space"], [104, "action-space"], [105, "action-space"], [108, "action-space"], [110, "action-space"]], "Observation Space": [[21, "observation-space"], [85, "observation-space"], [86, "observation-space"], [87, "observation-space"], [89, "observation-space"], [90, "observation-space"], [91, "observation-space"], [92, "observation-space"], [93, "observation-space"], [95, "observation-space"], [96, "observation-space"], [97, "observation-space"], [98, "observation-space"], [99, "observation-space"], [100, "observation-space"], [101, "observation-space"], [102, "observation-space"], [103, "observation-space"], [104, "observation-space"], [105, "observation-space"], [108, "observation-space"], [110, "observation-space"]], "Rewards": [[21, "rewards"], [24, "rewards"], [25, "rewards"], [27, "rewards"], [28, "rewards"], [29, "rewards"], [30, "rewards"], [31, "rewards"], [32, "rewards"], [33, "rewards"], [34, "rewards"], [35, "rewards"], [36, "rewards"], [37, "rewards"], [38, "rewards"], [39, "rewards"], [41, "rewards"], [42, "rewards"], [43, "rewards"], [44, "rewards"], [45, "rewards"], [46, "rewards"], [47, "rewards"], [48, "rewards"], [49, "rewards"], [50, "rewards"], [51, "rewards"], [52, "rewards"], [53, "rewards"], [54, "rewards"], [55, "rewards"], [56, "rewards"], [57, "rewards"], [63, "rewards"], [64, "rewards"], [65, "rewards"], [66, "rewards"], [67, "rewards"], [68, "rewards"], [69, "rewards"], [70, "rewards"], [71, "rewards"], [72, "rewards"], [73, "rewards"], [74, "rewards"], [75, "rewards"], [76, "rewards"], [77, "rewards"], [85, "rewards"], [86, "rewards"], [87, "rewards"], [89, "rewards"], [90, "rewards"], [93, "rewards"], [95, "rewards"], [96, "rewards"], [97, "rewards"], [98, "rewards"], [99, "rewards"], [100, "rewards"], [101, "rewards"], [102, "rewards"], [103, "rewards"], [104, "rewards"], [105, "rewards"], [108, "rewards"], [110, "rewards"], [111, "rewards"]], "Stochasticity": [[21, "stochasticity"]], "Common Arguments": [[21, "common-arguments"]], "Version History and Naming Schemes": [[21, "version-history-and-naming-schemes"]], "Flavors": [[21, "flavors"]], "References": [[21, "references"], [86, "references"], [89, "references"]], "Adventure": [[22, "adventure"]], "Description": [[22, "description"], [23, "description"], [24, "description"], [25, "description"], [26, "description"], [27, "description"], [28, "description"], [29, "description"], [30, "description"], [31, "description"], [32, "description"], [33, "description"], [34, "description"], [35, "description"], [36, "description"], [37, "description"], [38, "description"], [39, "description"], [41, "description"], [42, "description"], [43, "description"], [44, "description"], [45, "description"], [46, "description"], [47, "description"], [48, "description"], [49, "description"], [50, "description"], [51, "description"], [52, "description"], [53, "description"], [54, "description"], [55, "description"], [56, "description"], [57, "description"], [58, "description"], [59, "description"], [60, "description"], [61, "description"], [62, "description"], [63, "description"], [64, "description"], [65, "description"], [66, "description"], [67, "description"], [68, "description"], [69, "description"], [70, "description"], [71, "description"], [72, "description"], [73, "description"], [74, "description"], [75, "description"], [76, "description"], [77, "description"], [78, "description"], [79, "description"], [80, "description"], [81, "description"], [82, "description"], [83, "description"], [85, "description"], [86, "description"], [87, "description"], [89, "description"], [90, "description"], [91, "description"], [92, "description"], [93, "description"], [95, "description"], [96, "description"], [97, "description"], [98, "description"], [99, "description"], [100, "description"], [101, "description"], [102, "description"], [103, "description"], [104, "description"], [105, "description"], [108, "description"], [109, "description"], [111, "description"]], "Actions": [[22, "actions"], [23, "actions"], [24, "actions"], [25, "actions"], [26, "actions"], [27, "actions"], [28, "actions"], [29, "actions"], [30, "actions"], [31, "actions"], [32, "actions"], [33, "actions"], [34, "actions"], [35, "actions"], [36, "actions"], [37, "actions"], [38, "actions"], [39, "actions"], [41, "actions"], [42, "actions"], [43, "actions"], [44, "actions"], [45, "actions"], [46, "actions"], [52, "actions"], [53, "actions"], [54, "actions"], [55, "actions"], [56, "actions"], [57, "actions"], [58, "actions"], [59, "actions"], [60, "actions"], [61, "actions"], [62, "actions"], [63, "actions"], [64, "actions"], [65, "actions"], [66, "actions"], [67, "actions"], [68, "actions"], [69, "actions"], [70, "actions"], [71, "actions"], [72, "actions"], [73, "actions"], [74, "actions"], [75, "actions"], [76, "actions"], [77, "actions"], [78, "actions"], [79, "actions"], [80, "actions"], [81, "actions"], [82, "actions"], [83, "actions"], [109, "actions"], [111, "actions"]], "Observations": [[22, "observations"], [23, "observations"], [24, "observations"], [25, "observations"], [26, "observations"], [27, "observations"], [28, "observations"], [29, "observations"], [30, "observations"], [31, "observations"], [32, "observations"], [33, "observations"], [34, "observations"], [35, "observations"], [36, "observations"], [37, "observations"], [38, "observations"], [39, "observations"], [41, "observations"], [42, "observations"], [43, "observations"], [44, "observations"], [45, "observations"], [46, "observations"], [47, "observations"], [48, "observations"], [49, "observations"], [50, "observations"], [51, "observations"], [52, "observations"], [53, "observations"], [54, "observations"], [55, "observations"], [56, "observations"], [57, "observations"], [58, "observations"], [59, "observations"], [60, "observations"], [61, "observations"], [62, "observations"], [63, "observations"], [64, "observations"], [65, "observations"], [66, "observations"], [67, "observations"], [68, "observations"], [69, "observations"], [70, "observations"], [71, "observations"], [72, "observations"], [73, "observations"], [74, "observations"], [75, "observations"], [76, "observations"], [77, "observations"], [78, "observations"], [79, "observations"], [80, "observations"], [81, "observations"], [82, "observations"], [83, "observations"], [109, "observations"], [111, "observations"]], "Arguments": [[22, "arguments"], [23, "arguments"], [24, "arguments"], [25, "arguments"], [26, "arguments"], [27, "arguments"], [28, "arguments"], [29, "arguments"], [30, "arguments"], [31, "arguments"], [32, "arguments"], [33, "arguments"], [34, "arguments"], [35, "arguments"], [36, "arguments"], [37, "arguments"], [38, "arguments"], [39, "arguments"], [41, "arguments"], [42, "arguments"], [43, "arguments"], [44, "arguments"], [45, "arguments"], [46, "arguments"], [47, "arguments"], [48, "arguments"], [49, "arguments"], [50, "arguments"], [51, "arguments"], [52, "arguments"], [53, "arguments"], [54, "arguments"], [55, "arguments"], [56, "arguments"], [57, "arguments"], [58, "arguments"], [59, "arguments"], [60, "arguments"], [61, "arguments"], [62, "arguments"], [63, "arguments"], [64, "arguments"], [65, "arguments"], [66, "arguments"], [67, "arguments"], [68, "arguments"], [69, "arguments"], [70, "arguments"], [71, "arguments"], [72, "arguments"], [73, "arguments"], [74, "arguments"], [75, "arguments"], [76, "arguments"], [77, "arguments"], [78, "arguments"], [79, "arguments"], [80, "arguments"], [81, "arguments"], [82, "arguments"], [83, "arguments"], [85, "arguments"], [86, "arguments"], [87, "arguments"], [89, "arguments"], [90, "arguments"], [91, "arguments"], [92, "arguments"], [93, "arguments"], [95, "arguments"], [96, "arguments"], [97, "arguments"], [98, "arguments"], [99, "arguments"], [100, "arguments"], [101, "arguments"], [102, "arguments"], [103, "arguments"], [104, "arguments"], [105, "arguments"], [108, "arguments"], [109, "arguments"], [110, "arguments"], [111, "arguments"]], "Version History": [[22, "version-history"], [23, "version-history"], [24, "version-history"], [25, "version-history"], [26, "version-history"], [27, "version-history"], [28, "version-history"], [29, "version-history"], [30, "version-history"], [31, "version-history"], [32, "version-history"], [33, "version-history"], [34, "version-history"], [35, "version-history"], [36, "version-history"], [37, "version-history"], [38, "version-history"], [39, "version-history"], [41, "version-history"], [42, "version-history"], [43, "version-history"], [44, "version-history"], [45, "version-history"], [46, "version-history"], [47, "version-history"], [48, "version-history"], [49, "version-history"], [50, "version-history"], [51, "version-history"], [52, "version-history"], [53, "version-history"], [54, "version-history"], [55, "version-history"], [56, "version-history"], [57, "version-history"], [58, "version-history"], [59, "version-history"], [60, "version-history"], [61, "version-history"], [62, "version-history"], [63, "version-history"], [64, "version-history"], [65, "version-history"], [66, "version-history"], [67, "version-history"], [68, "version-history"], [69, "version-history"], [70, "version-history"], [71, "version-history"], [72, "version-history"], [73, "version-history"], [74, "version-history"], [75, "version-history"], [76, "version-history"], [77, "version-history"], [78, "version-history"], [79, "version-history"], [80, "version-history"], [81, "version-history"], [82, "version-history"], [83, "version-history"], [85, "version-history"], [86, "version-history"], [87, "version-history"], [89, "version-history"], [91, "version-history"], [92, "version-history"], [93, "version-history"], [95, "version-history"], [96, "version-history"], [97, "version-history"], [98, "version-history"], [99, "version-history"], [100, "version-history"], [101, "version-history"], [102, "version-history"], [103, "version-history"], [104, "version-history"], [105, "version-history"], [108, "version-history"], [109, "version-history"], [110, "version-history"], [111, "version-history"]], "Air Raid": [[23, "air-raid"]], "Alien": [[24, "alien"]], "Amidar": [[25, "amidar"]], "Assault": [[26, "assault"]], "Asterix": [[27, "asterix"]], "Asteroids": [[28, "asteroids"]], "Atlantis": [[29, "atlantis"]], "Bank Heist": [[30, "bank-heist"]], "Battle Zone": [[31, "battle-zone"]], "Beam Rider": [[32, "beam-rider"]], "Berzerk": [[33, "berzerk"]], "Bowling": [[34, "bowling"]], "Boxing": [[35, "boxing"]], "Breakout": [[36, "breakout"]], "Carnival": [[37, "carnival"]], "Centipede": [[38, "centipede"]], "Chopper Command": [[39, "chopper-command"]], "Complete List - Atari": [[40, "complete-list-atari"]], "Crazy Climber": [[41, "crazy-climber"]], "Defender": [[42, "defender"]], "Demon Attack": [[43, "demon-attack"]], "Double Dunk": [[44, "double-dunk"]], "Elevator Action": [[45, "elevator-action"]], "Enduro": [[46, "enduro"]], "FishingDerby": [[47, "fishingderby"]], "Freeway": [[48, "freeway"]], "Frostbite": [[49, "frostbite"]], "Gopher": [[50, "gopher"]], "Gravitar": [[51, "gravitar"]], "Hero": [[52, "hero"]], "IceHockey": [[53, "icehockey"]], "Jamesbond": [[54, "jamesbond"]], "JourneyEscape": [[55, "journeyescape"]], "Kangaroo": [[56, "kangaroo"]], "Krull": [[57, "krull"]], "Kung Fu Master": [[58, "kung-fu-master"]], "Montezuma Revenge": [[59, "montezuma-revenge"]], "Ms Pacman": [[60, "ms-pacman"]], "Name This Game": [[61, "name-this-game"]], "Phoenix": [[62, "phoenix"]], "Pitfall": [[63, "pitfall"]], "Pong": [[64, "pong"]], "Pooyan": [[65, "pooyan"]], "PrivateEye": [[66, "privateeye"]], "Qbert": [[67, "qbert"]], "Riverraid": [[68, "riverraid"]], "Road Runner": [[69, "road-runner"]], "Robot Tank": [[70, "robot-tank"]], "Seaquest": [[71, "seaquest"]], "Skiings": [[72, "skiings"]], "Solaris": [[73, "solaris"]], "SpaceInvaders": [[74, "spaceinvaders"]], "StarGunner": [[75, "stargunner"]], "Tennis": [[76, "tennis"]], "TimePilot": [[77, "timepilot"]], "Tutankham": [[78, "tutankham"]], "Up n\u2019 Down": [[79, "up-n-down"]], "Venture": [[80, "venture"]], "Video Pinball": [[81, "video-pinball"]], "Wizard of Wor": [[82, "wizard-of-wor"]], "Zaxxon": [[83, "zaxxon"]], "Box2D": [[84, "box2d"]], "Bipedal Walker": [[85, "bipedal-walker"]], "Starting State": [[85, "starting-state"], [86, "starting-state"], [87, "starting-state"], [89, "starting-state"], [90, "starting-state"], [91, "starting-state"], [92, "starting-state"], [93, "starting-state"], [95, "starting-state"], [96, "starting-state"], [97, "starting-state"], [98, "starting-state"], [99, "starting-state"], [100, "starting-state"], [101, "starting-state"], [102, "starting-state"], [103, "starting-state"], [104, "starting-state"], [105, "starting-state"]], "Episode Termination": [[85, "episode-termination"], [86, "episode-termination"], [87, "episode-termination"]], "Credits": [[85, "credits"], [86, "credits"], [87, "credits"]], "Car Racing": [[86, "car-racing"]], "Reset Arguments": [[86, "reset-arguments"]], "Lunar Lander": [[87, "lunar-lander"]], "Classic Control": [[88, "classic-control"]], "Acrobot": [[89, "acrobot"]], "Episode End": [[89, "episode-end"], [90, "episode-end"], [91, "episode-end"], [92, "episode-end"], [95, "episode-end"], [96, "episode-end"], [97, "episode-end"], [98, "episode-end"], [99, "episode-end"], [100, "episode-end"], [101, "episode-end"], [102, "episode-end"], [103, "episode-end"], [104, "episode-end"], [105, "episode-end"]], "Cart Pole": [[90, "cart-pole"]], "Mountain Car": [[91, "mountain-car"]], "Transition Dynamics:": [[91, "transition-dynamics"], [92, "transition-dynamics"]], "Reward:": [[91, "reward"]], "Mountain Car Continuous": [[92, "mountain-car-continuous"]], "Reward": [[92, "reward"], [109, "reward"]], "Pendulum": [[93, "pendulum"]], "Episode Truncation": [[93, "episode-truncation"]], "MuJoCo": [[94, "mujoco"]], "Ant": [[95, "ant"]], "Half Cheetah": [[96, "half-cheetah"]], "Hopper": [[97, "hopper"]], "Humanoid": [[98, "humanoid"]], "Humanoid Standup": [[99, "humanoid-standup"]], "Inverted Double Pendulum": [[100, "inverted-double-pendulum"]], "Inverted Pendulum": [[101, "inverted-pendulum"]], "Pusher": [[102, "pusher"]], "Reacher": [[103, "reacher"]], "Swimmer": [[104, "swimmer"]], "Notes": [[104, "notes"]], "Walker2D": [[105, "walker2d"]], "Third-Party Environments": [[106, "third-party-environments"]], "Video Game Environments": [[106, "video-game-environments"]], "ViZDoom": [[106, "vizdoom"]], " flappy-bird-gym: A Flappy Bird environment for OpenAI Gym": [[106, "flappy-bird-gym-a-flappy-bird-environment-for-openai-gym"]], " gym-derk: GPU accelerated MOBA environment": [[106, "gym-derk-gpu-accelerated-moba-environment"]], " MineRL": [[106, "minerl"]], " Procgen": [[106, "procgen"]], " SlimeVolleyGym: A simple environment for single and multi-agent reinforcement learning": [[106, "slimevolleygym-a-simple-environment-for-single-and-multi-agent-reinforcement-learning"]], " stable-retro": [[106, "stable-retro"]], " Unity ML Agents": [[106, "unity-ml-agents"]], "Classic Environments (board, card, etc. games)": [[106, "classic-environments-board-card-etc-games"]], " gym-abalone: A two-player abstract strategy board game": [[106, "gym-abalone-a-two-player-abstract-strategy-board-game"]], " gym-spoof": [[106, "gym-spoof"]], " gym-xiangqi: Xiangqi - The Chinese Chess Game": [[106, "gym-xiangqi-xiangqi-the-chinese-chess-game"]], " RubiksCubeGym": [[106, "rubikscubegym"]], " GymGo": [[106, "gymgo"]], "Robotics Environments": [[106, "robotics-environments"]], " GymFC: A flight control tuning and training framework": [[106, "gymfc-a-flight-control-tuning-and-training-framework"]], " gym-gazebo": [[106, "gym-gazebo"]], " gym-goddard: Goddard\u2019s Rocket Problem": [[106, "gym-goddard-goddard-s-rocket-problem"]], " gym-jiminy: training Robots in Jiminy": [[106, "gym-jiminy-training-robots-in-jiminy"]], " gym-miniworld": [[106, "gym-miniworld"]], " gym-pybullet-drones": [[106, "gym-pybullet-drones"]], " MarsExplorer": [[106, "marsexplorer"]], " panda-gym ": [[106, "panda-gym"]], " PyBullet Robotics Environments": [[106, "pybullet-robotics-environments"]], " robo-gym": [[106, "robo-gym"]], " Offworld-gym": [[106, "offworld-gym"]], "Autonomous Driving and Traffic Control Environments": [[106, "autonomous-driving-and-traffic-control-environments"]], " gym-carla": [[106, "gym-carla"]], " gym-duckietown": [[106, "gym-duckietown"]], " gym-electric-motor": [[106, "gym-electric-motor"]], " highway-env": [[106, "highway-env"]], " LongiControl": [[106, "longicontrol"]], " sumo-rl": [[106, "sumo-rl"]], " CommonRoad-RL": [[106, "commonroad-rl"]], "Multi-Agents": [[106, "multi-agents"]], "PettingZoo": [[106, "pettingzoo"]], "Other Environments": [[106, "other-environments"]], " anomalous_rl_envs": [[106, "anomalous-rl-envs"]], " CARL": [[106, "carl"]], " CompilerGym": [[106, "compilergym"]], " DACBench": [[106, "dacbench"]], " Gridworld": [[106, "gridworld"]], " gym-adserve": [[106, "gym-adserve"]], " gym-algorithmic": [[106, "gym-algorithmic"]], " gym-anytrading": [[106, "gym-anytrading"]], " gym-autokey": [[106, "gym-autokey"]], " gym-ccc": [[106, "gym-ccc"]], " gym-cellular-automata": [[106, "gym-cellular-automata"]], " gym-games": [[106, "gym-games"]], " gym-inventory": [[106, "gym-inventory"]], " gym-maze": [[106, "gym-maze"]], " gym-mtsim": [[106, "gym-mtsim"]], " gym-legacy-toytext": [[106, "gym-legacy-toytext"]], " gym-riverswim": [[106, "gym-riverswim"]], " gym-recsys": [[106, "gym-recsys"]], " gym-sokoban": [[106, "gym-sokoban"]], " math-prog-synth-env": [[106, "math-prog-synth-env"]], " NASGym": [[106, "nasgym"]], " NLPGym: A toolkit to develop RL agents to solve NLP tasks": [[106, "nlpgym-a-toolkit-to-develop-rl-agents-to-solve-nlp-tasks"]], " Obstacle Tower": [[106, "obstacle-tower"]], " openmodelica-microgrid-gym": [[106, "openmodelica-microgrid-gym"]], " osim-rl": [[106, "osim-rl"]], " PGE: Parallel Game Engine": [[106, "pge-parallel-game-engine"]], " QASGym": [[106, "qasgym"]], " safe-control-gym": [[106, "safe-control-gym"]], " VirtualTaobao": [[106, "virtualtaobao"]], " mo-gym": [[106, "mo-gym"]], "ABIDES-Gym": [[106, "abides-gym"]], "gym-saturation": [[106, "gym-saturation"]], "ShinRL": [[106, "shinrl"]], "racing-rl": [[106, "racing-rl"]], "go-explore": [[106, "go-explore"]], "tmrl": [[106, "tmrl"]], "racing_dreamer": [[106, "racing-dreamer"]], "racecar_gym": [[106, "racecar-gym"]], "jiminy": [[106, "jiminy"]], "evogym-design-tool": [[106, "evogym-design-tool"]], "l2r": [[106, "l2r"]], "gym_torcs": [[106, "gym-torcs"]], "mobile-env": [[106, "mobile-env"]], "gym-softrobot": [[106, "gym-softrobot"]], "PyElastica": [[106, "pyelastica"]], "tuxkart-ai": [[106, "tuxkart-ai"]], "ostrichrl": [[106, "ostrichrl"]], "quadruped-gym": [[106, "quadruped-gym"]], "Pogo-Stick-Jumping": [[106, "pogo-stick-jumping"]], "evogym": [[106, "evogym"]], "iGibson": [[106, "igibson"]], "SnakeRL": [[106, "snakerl"]], "starship-landing-gym": [[106, "starship-landing-gym"]], "CompilerGym": [[106, "id1"]], "RaveForce": [[106, "raveforce"]], "gym-line-follower": [[106, "gym-line-follower"]], "DexterousHands": [[106, "dexteroushands"]], "OmniIsaacGymEnvs": [[106, "omniisaacgymenvs"]], "border": [[106, "border"]], "SpaceRobotEnv": [[106, "spacerobotenv"]], "gymnax": [[106, "gymnax"]], "Toy Text": [[107, "toy-text"]], "Blackjack": [[108, "blackjack"]], "Cliff Walking": [[109, "cliff-walking"]], "Frozen Lake": [[110, "frozen-lake"]], "Taxi": [[111, "taxi"]], "Info": [[111, "info"]], "Gymnasium is a standard API for reinforcement learning, and a diverse collection of reference environments": [[112, "gymnasium-is-a-standard-api-for-reinforcement-learning-and-a-diverse-collection-of-reference-environments"]]}, "indexentries": {"env (class in gymnasium)": [[2, "gymnasium.Env"]], "action_space (gymnasium.env attribute)": [[2, "gymnasium.Env.action_space"]], "close() (in module gymnasium.env)": [[2, "gymnasium.Env.close"]], "metadata (gymnasium.env attribute)": [[2, "gymnasium.Env.metadata"]], "np_random (gymnasium.env property)": [[2, "gymnasium.Env.np_random"]], "observation_space (gymnasium.env attribute)": [[2, "gymnasium.Env.observation_space"]], "render() (in module gymnasium.env)": [[2, "gymnasium.Env.render"]], "render_mode (gymnasium.env attribute)": [[2, "gymnasium.Env.render_mode"]], "reset() (in module gymnasium.env)": [[2, "gymnasium.Env.reset"]], "reward_range (gymnasium.env attribute)": [[2, "gymnasium.Env.reward_range"]], "spec (gymnasium.env attribute)": [[2, "gymnasium.Env.spec"]], "step() (in module gymnasium.env)": [[2, "gymnasium.Env.step"]], "unwrapped (gymnasium.env property)": [[2, "gymnasium.Env.unwrapped"]], "make() (in module gymnasium)": [[3, "gymnasium.make"]], "register() (in module gymnasium)": [[3, "gymnasium.register"]], "spec() (in module gymnasium)": [[3, "gymnasium.spec"]], "space (class in gymnasium.spaces)": [[4, "gymnasium.spaces.Space"]], "contains() (in module gymnasium.spaces.space.space)": [[4, "gymnasium.spaces.space.Space.contains"]], "dtype (space property)": [[4, "Space.dtype"]], "from_jsonable() (in module gymnasium.spaces.space.space)": [[4, "gymnasium.spaces.space.Space.from_jsonable"]], "sample() (in module gymnasium.spaces.space.space)": [[4, "gymnasium.spaces.space.Space.sample"]], "seed() (in module gymnasium.spaces.space.space)": [[4, "gymnasium.spaces.space.Space.seed"]], "shape (gymnasium.spaces.space.space property)": [[4, "gymnasium.spaces.space.Space.shape"]], "to_jsonable() (in module gymnasium.spaces.space.space)": [[4, "gymnasium.spaces.space.Space.to_jsonable"]], "dict (class in gymnasium.spaces)": [[5, "gymnasium.spaces.Dict"]], "graph (class in gymnasium.spaces)": [[5, "gymnasium.spaces.Graph"]], "sequence (class in gymnasium.spaces)": [[5, "gymnasium.spaces.Sequence"]], "tuple (class in gymnasium.spaces)": [[5, "gymnasium.spaces.Tuple"]], "sample() (gymnasium.spaces.dict method)": [[5, "gymnasium.spaces.Dict.sample"]], "sample() (gymnasium.spaces.graph method)": [[5, "gymnasium.spaces.Graph.sample"]], "sample() (gymnasium.spaces.sequence method)": [[5, "gymnasium.spaces.Sequence.sample"]], "sample() (gymnasium.spaces.tuple method)": [[5, "gymnasium.spaces.Tuple.sample"]], "seed() (gymnasium.spaces.dict method)": [[5, "gymnasium.spaces.Dict.seed"]], "seed() (gymnasium.spaces.graph method)": [[5, "gymnasium.spaces.Graph.seed"]], "seed() (gymnasium.spaces.sequence method)": [[5, "gymnasium.spaces.Sequence.seed"]], "seed() (gymnasium.spaces.tuple method)": [[5, "gymnasium.spaces.Tuple.seed"]], "box (class in gymnasium.spaces)": [[6, "gymnasium.spaces.Box"]], "discrete (class in gymnasium.spaces)": [[6, "gymnasium.spaces.Discrete"]], "multibinary (class in gymnasium.spaces)": [[6, "gymnasium.spaces.MultiBinary"]], "multidiscrete (class in gymnasium.spaces)": [[6, "gymnasium.spaces.MultiDiscrete"]], "text (class in gymnasium.spaces)": [[6, "gymnasium.spaces.Text"]], "is_bounded() (gymnasium.spaces.box method)": [[6, "gymnasium.spaces.Box.is_bounded"]], "sample() (gymnasium.spaces.box method)": [[6, "gymnasium.spaces.Box.sample"]], "sample() (gymnasium.spaces.discrete method)": [[6, "gymnasium.spaces.Discrete.sample"]], "sample() (gymnasium.spaces.multibinary method)": [[6, "gymnasium.spaces.MultiBinary.sample"]], "sample() (gymnasium.spaces.multidiscrete method)": [[6, "gymnasium.spaces.MultiDiscrete.sample"]], "sample() (gymnasium.spaces.text method)": [[6, "gymnasium.spaces.Text.sample"]], "seed() (gymnasium.spaces.box method)": [[6, "gymnasium.spaces.Box.seed"]], "seed() (gymnasium.spaces.discrete method)": [[6, "gymnasium.spaces.Discrete.seed"]], "seed() (gymnasium.spaces.multibinary method)": [[6, "gymnasium.spaces.MultiBinary.seed"]], "seed() (gymnasium.spaces.multidiscrete method)": [[6, "gymnasium.spaces.MultiDiscrete.seed"]], "seed() (gymnasium.spaces.text method)": [[6, "gymnasium.spaces.Text.seed"]], "flatdim() (in module gymnasium.spaces.utils)": [[7, "gymnasium.spaces.utils.flatdim"]], "flatten() (in module gymnasium.spaces.utils)": [[7, "gymnasium.spaces.utils.flatten"]], "flatten_space() (in module gymnasium.spaces.utils)": [[7, "gymnasium.spaces.utils.flatten_space"]], "unflatten() (in module gymnasium.spaces.utils)": [[7, "gymnasium.spaces.utils.unflatten"]], "batch_space() (in module gymnasium.vector.utils)": [[8, "gymnasium.vector.utils.batch_space"]], "concatenate() (in module gymnasium.vector.utils)": [[8, "gymnasium.vector.utils.concatenate"]], "create_empty_array() (in module gymnasium.vector.utils)": [[8, "gymnasium.vector.utils.create_empty_array"]], "create_shared_memory() (in module gymnasium.vector.utils)": [[8, "gymnasium.vector.utils.create_shared_memory"]], "iterate() (in module gymnasium.vector.utils)": [[8, "gymnasium.vector.utils.iterate"]], "read_from_shared_memory() (in module gymnasium.vector.utils)": [[8, "gymnasium.vector.utils.read_from_shared_memory"]], "write_to_shared_memory() (in module gymnasium.vector.utils)": [[8, "gymnasium.vector.utils.write_to_shared_memory"]], "playplot (class in gymnasium.utils.play)": [[9, "gymnasium.utils.play.PlayPlot"]], "playablegame (class in gymnasium.utils.play)": [[9, "gymnasium.utils.play.PlayableGame"]], "callback() (gymnasium.utils.play.playplot method)": [[9, "gymnasium.utils.play.PlayPlot.callback"]], "capped_cubic_video_schedule() (in module gymnasium.utils.save_video)": [[9, "gymnasium.utils.save_video.capped_cubic_video_schedule"]], "check_env() (in module gymnasium.utils.env_checker)": [[9, "gymnasium.utils.env_checker.check_env"]], "convert_to_done_step_api() (in module gymnasium.utils.step_api_compatibility)": [[9, "gymnasium.utils.step_api_compatibility.convert_to_done_step_api"]], "convert_to_terminated_truncated_step_api() (in module gymnasium.utils.step_api_compatibility)": [[9, "gymnasium.utils.step_api_compatibility.convert_to_terminated_truncated_step_api"]], "np_random() (in module gymnasium.utils.seeding)": [[9, "gymnasium.utils.seeding.np_random"]], "play() (in module gymnasium.utils.play)": [[9, "gymnasium.utils.play.play"]], "process_event() (gymnasium.utils.play.playablegame method)": [[9, "gymnasium.utils.play.PlayableGame.process_event"]], "save_video() (in module gymnasium.utils.save_video)": [[9, "gymnasium.utils.save_video.save_video"]], "step_api_compatibility() (in module gymnasium.utils.step_api_compatibility)": [[9, "gymnasium.utils.step_api_compatibility.step_api_compatibility"]], "asyncvectorenv (class in gymnasium.vector)": [[10, "gymnasium.vector.AsyncVectorEnv"]], "syncvectorenv (class in gymnasium.vector)": [[10, "gymnasium.vector.SyncVectorEnv"]], "vectorenv (class in gymnasium.vector)": [[10, "gymnasium.vector.VectorEnv"]], "action_space": [[10, "action_space"]], "close() (gymnasium.vector.vectorenv method)": [[10, "gymnasium.vector.VectorEnv.close"]], "make() (in module gymnasium.vector)": [[10, "gymnasium.vector.make"]], "observation_space": [[10, "observation_space"]], "reset() (gymnasium.vector.vectorenv method)": [[10, "gymnasium.vector.VectorEnv.reset"]], "single_action_space": [[10, "single_action_space"]], "single_observation_space": [[10, "single_observation_space"]], "step() (gymnasium.vector.vectorenv method)": [[10, "gymnasium.vector.VectorEnv.step"]], "wrapper (class in gymnasium)": [[11, "gymnasium.Wrapper"]], "action_space (gymnasium.wrapper property)": [[11, "gymnasium.Wrapper.action_space"]], "close() (in module gymnasium.wrapper)": [[11, "gymnasium.Wrapper.close"]], "metadata (gymnasium.wrapper property)": [[11, "gymnasium.Wrapper.metadata"]], "np_random (gymnasium.wrapper property)": [[11, "gymnasium.Wrapper.np_random"]], "observation_space (gymnasium.wrapper property)": [[11, "gymnasium.Wrapper.observation_space"]], "reset() (in module gymnasium.wrapper)": [[11, "gymnasium.Wrapper.reset"]], "reward_range (gymnasium.wrapper property)": [[11, "gymnasium.Wrapper.reward_range"]], "spec (gymnasium.wrapper property)": [[11, "gymnasium.Wrapper.spec"]], "step() (in module gymnasium.wrapper)": [[11, "gymnasium.Wrapper.step"]], "unwrapped (gymnasium.wrapper property)": [[11, "gymnasium.Wrapper.unwrapped"]], "actionwrapper (class in gymnasium)": [[12, "gymnasium.ActionWrapper"]], "actionwrapper.action() (in module gymnasium.actionwrapper)": [[12, "gymnasium.ActionWrapper.ActionWrapper.action"]], "clipaction (class in gymnasium.wrappers)": [[12, "gymnasium.wrappers.ClipAction"]], "rescaleaction (class in gymnasium.wrappers)": [[12, "gymnasium.wrappers.RescaleAction"]], "ataripreprocessing (class in gymnasium.wrappers)": [[13, "gymnasium.wrappers.AtariPreprocessing"]], "autoresetwrapper (class in gymnasium.wrappers)": [[13, "gymnasium.wrappers.AutoResetWrapper"]], "envcompatibility (class in gymnasium.wrappers)": [[13, "gymnasium.wrappers.EnvCompatibility"]], "humanrendering (class in gymnasium.wrappers)": [[13, "gymnasium.wrappers.HumanRendering"]], "orderenforcing (class in gymnasium.wrappers)": [[13, "gymnasium.wrappers.OrderEnforcing"]], "passiveenvchecker (class in gymnasium.wrappers)": [[13, "gymnasium.wrappers.PassiveEnvChecker"]], "recordepisodestatistics (class in gymnasium.wrappers)": [[13, "gymnasium.wrappers.RecordEpisodeStatistics"]], "recordvideo (class in gymnasium.wrappers)": [[13, "gymnasium.wrappers.RecordVideo"]], "rendercollection (class in gymnasium.wrappers)": [[13, "gymnasium.wrappers.RenderCollection"]], "stepapicompatibility (class in gymnasium.wrappers)": [[13, "gymnasium.wrappers.StepAPICompatibility"]], "timelimit (class in gymnasium.wrappers)": [[13, "gymnasium.wrappers.TimeLimit"]], "vectorlistinfo (class in gymnasium.wrappers)": [[13, "gymnasium.wrappers.VectorListInfo"]], "filterobservation (class in gymnasium.wrappers)": [[14, "gymnasium.wrappers.FilterObservation"]], "flattenobservation (class in gymnasium.wrappers)": [[14, "gymnasium.wrappers.FlattenObservation"]], "framestack (class in gymnasium.wrappers)": [[14, "gymnasium.wrappers.FrameStack"]], "grayscaleobservation (class in gymnasium.wrappers)": [[14, "gymnasium.wrappers.GrayScaleObservation"]], "normalizeobservation (class in gymnasium.wrappers)": [[14, "gymnasium.wrappers.NormalizeObservation"]], "observationwrapper (class in gymnasium)": [[14, "gymnasium.ObservationWrapper"]], "pixelobservationwrapper (class in gymnasium.wrappers)": [[14, "gymnasium.wrappers.PixelObservationWrapper"]], "resizeobservation (class in gymnasium.wrappers)": [[14, "gymnasium.wrappers.ResizeObservation"]], "timeawareobservation (class in gymnasium.wrappers)": [[14, "gymnasium.wrappers.TimeAwareObservation"]], "transformobservation (class in gymnasium.wrappers)": [[14, "gymnasium.wrappers.TransformObservation"]], "observation() (in module gymnasium.observationwrapper)": [[14, "gymnasium.ObservationWrapper.observation"]], "normalizereward (class in gymnasium.wrappers)": [[15, "gymnasium.wrappers.NormalizeReward"]], "rewardwrapper (class in gymnasium)": [[15, "gymnasium.RewardWrapper"]], "rewardwrapper.reward() (in module gymnasium.rewardwrapper)": [[15, "gymnasium.RewardWrapper.RewardWrapper.reward"]], "transformreward (class in gymnasium.wrappers)": [[15, "gymnasium.wrappers.TransformReward"]]}})