Search.setIndex({"docnames": ["404", "README", "api/env", "api/registry", "api/spaces", "api/spaces/composite", "api/spaces/fundamental", "api/spaces/utils", "api/spaces/vector_utils", "api/utils", "api/vector", "api/wrappers", "api/wrappers/action_wrappers", "api/wrappers/misc_wrappers", "api/wrappers/observation_wrappers", "api/wrappers/reward_wrappers", "content/basic_usage", "content/gym_compatibility", "content/migration-guide", "environments/atari", "environments/atari/adventure", "environments/atari/air_raid", "environments/atari/alien", "environments/atari/amidar", "environments/atari/assault", "environments/atari/asterix", "environments/atari/asteroids", "environments/atari/atlantis", "environments/atari/bank_heist", "environments/atari/battle_zone", "environments/atari/beam_rider", "environments/atari/berzerk", "environments/atari/bowling", "environments/atari/boxing", "environments/atari/breakout", "environments/atari/carnival", "environments/atari/centipede", "environments/atari/chopper_command", "environments/atari/crazy_climber", "environments/atari/defender", "environments/atari/demon_attack", "environments/atari/double_dunk", "environments/atari/elevator_action", "environments/atari/enduro", "environments/atari/fishing_derby", "environments/atari/freeway", "environments/atari/frostbite", "environments/atari/gopher", "environments/atari/gravitar", "environments/atari/hero", "environments/atari/ice_hockey", "environments/atari/jamesbond", "environments/atari/journey_escape", "environments/atari/kangaroo", "environments/atari/krull", "environments/atari/kung_fu_master", "environments/atari/montezuma_revenge", "environments/atari/ms_pacman", "environments/atari/name_this_game", "environments/atari/phoenix", "environments/atari/pitfall", "environments/atari/pong", "environments/atari/pooyan", "environments/atari/private_eye", "environments/atari/qbert", "environments/atari/riverraid", "environments/atari/road_runner", "environments/atari/robotank", "environments/atari/seaquest", "environments/atari/skiing", "environments/atari/solaris", "environments/atari/space_invaders", "environments/atari/star_gunner", "environments/atari/tennis", "environments/atari/time_pilot", "environments/atari/tutankham", "environments/atari/up_n_down", "environments/atari/venture", "environments/atari/video_pinball", "environments/atari/wizard_of_wor", "environments/atari/zaxxon", "environments/box2d", "environments/classic_control", "environments/mujoco", "environments/third_party_environments", "environments/toy_text", "index", "tutorials/blackjack_tutorial", "tutorials/environment_creation", "tutorials/handling_time_limits"], "filenames": ["404.md", "README.md", "api/env.md", "api/registry.md", "api/spaces.md", "api/spaces/composite.md", "api/spaces/fundamental.md", "api/spaces/utils.md", "api/spaces/vector_utils.md", "api/utils.md", "api/vector.md", "api/wrappers.md", "api/wrappers/action_wrappers.md", "api/wrappers/misc_wrappers.md", "api/wrappers/observation_wrappers.md", "api/wrappers/reward_wrappers.md", "content/basic_usage.md", "content/gym_compatibility.md", "content/migration-guide.md", "environments/atari.md", "environments/atari/adventure.md", "environments/atari/air_raid.md", "environments/atari/alien.md", "environments/atari/amidar.md", "environments/atari/assault.md", "environments/atari/asterix.md", "environments/atari/asteroids.md", "environments/atari/atlantis.md", "environments/atari/bank_heist.md", "environments/atari/battle_zone.md", "environments/atari/beam_rider.md", "environments/atari/berzerk.md", "environments/atari/bowling.md", "environments/atari/boxing.md", "environments/atari/breakout.md", "environments/atari/carnival.md", "environments/atari/centipede.md", "environments/atari/chopper_command.md", "environments/atari/crazy_climber.md", "environments/atari/defender.md", "environments/atari/demon_attack.md", "environments/atari/double_dunk.md", "environments/atari/elevator_action.md", "environments/atari/enduro.md", "environments/atari/fishing_derby.md", "environments/atari/freeway.md", "environments/atari/frostbite.md", "environments/atari/gopher.md", "environments/atari/gravitar.md", "environments/atari/hero.md", "environments/atari/ice_hockey.md", "environments/atari/jamesbond.md", "environments/atari/journey_escape.md", "environments/atari/kangaroo.md", "environments/atari/krull.md", "environments/atari/kung_fu_master.md", "environments/atari/montezuma_revenge.md", "environments/atari/ms_pacman.md", "environments/atari/name_this_game.md", "environments/atari/phoenix.md", "environments/atari/pitfall.md", "environments/atari/pong.md", "environments/atari/pooyan.md", "environments/atari/private_eye.md", "environments/atari/qbert.md", "environments/atari/riverraid.md", "environments/atari/road_runner.md", "environments/atari/robotank.md", "environments/atari/seaquest.md", "environments/atari/skiing.md", "environments/atari/solaris.md", "environments/atari/space_invaders.md", "environments/atari/star_gunner.md", "environments/atari/tennis.md", "environments/atari/time_pilot.md", "environments/atari/tutankham.md", "environments/atari/up_n_down.md", "environments/atari/venture.md", "environments/atari/video_pinball.md", "environments/atari/wizard_of_wor.md", "environments/atari/zaxxon.md", "environments/box2d.md", "environments/classic_control.md", "environments/mujoco.md", "environments/third_party_environments.md", "environments/toy_text.md", "index.md", "tutorials/blackjack_tutorial.rst", "tutorials/environment_creation.rst", "tutorials/handling_time_limits.rst"], "titles": ["404 - Page Not Found", "Gymnasium-docs", "Env", "Registry", "Spaces", "Composite Spaces", "Fundamental Spaces", "Spaces Utils", "Spaces Vector Utils", "Utils", "Vector", "Wrappers", "Action Wrappers", "Misc Wrappers", "Observation Wrappers", "Reward Wrappers", "Basic Usage", "Compatibility with Gym", "v21 to v26 Migration Guide", "Atari", "Adventure", "Air Raid", "Alien", "Amidar", "Assault", "Asterix", "Asteroids", "Atlantis", "Bank Heist", "Battle Zone", "Beam Rider", "Berzerk", "Bowling", "Boxing", "Breakout", "Carnival", "Centipede", "Chopper Command", "Crazy Climber", "Defender", "Demon Attack", "Double Dunk", "Elevator Action", "Enduro", "FishingDerby", "Freeway", "Frostbite", "Gopher", "Gravitar", "Hero", "IceHockey", "Jamesbond", "JourneyEscape", "Kangaroo", "Krull", "Kung Fu Master", "Montezuma Revenge", "Ms Pacman", "Name This Game", "Phoenix", "Pitfall", "Pong", "Pooyan", "PrivateEye", "Qbert", "Riverraid", "Road Runner", "Robot Tank", "Seaquest", "Skiings", "Solaris", "SpaceInvaders", "StarGunner", "Tennis", "TimePilot", "Tutankham", "Up n\u2019 Down", "Venture", "Video Pinball", "Wizard of Wor", "Zaxxon", "Box2D", "Classic Control", "MuJoCo", "Third-Party Environments", "Toy Text", "Gymnasium is a standard API for reinforcement learning, and a diverse collection of reference environments", "Solving Blackjack with Q-Learning", "Make your own custom environment", "Handling Time Limits"], "terms": {"thi": [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 87, 88, 89], "folder": [1, 9, 13], "contain": [1, 2, 4, 7, 8, 10, 11, 13, 14, 16, 18, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 84, 87, 88], "If": [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 19, 25, 28, 33, 36, 44, 45, 46, 47, 48, 62, 69, 73, 87, 88], "you": [1, 2, 4, 5, 6, 7, 9, 10, 11, 12, 13, 14, 15, 16, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 84, 87, 88, 89], "ar": [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 87, 88, 89], "pleas": [1, 2, 9, 18, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80], "pr": [1, 18, 84], "repo": [1, 19, 84], "otherwis": [1, 2, 3, 5, 6, 9, 10, 13, 14, 19, 32, 84], "follow": [1, 3, 4, 9, 11, 12, 13, 15, 16, 19, 32, 41, 43, 44, 45, 46, 47, 48, 73, 87, 88, 89], "below": [1, 6, 11, 16, 44, 87, 89], "directli": [1, 5, 11, 13, 16, 84, 87, 88], "markdown": 1, "file": [1, 83, 88], "repositori": [1, 11, 83, 84], "fork": [1, 18, 84, 86], "docstr": 1, "": [1, 2, 5, 6, 9, 10, 11, 12, 13, 14, 15, 16, 19, 38, 44, 45, 46, 47, 48, 50, 51, 54, 55, 56, 61, 62, 64, 81, 82, 85, 86, 87, 88, 89], "python": [1, 3, 8, 13, 16, 84, 85, 86, 87, 88, 89], "Then": [1, 11, 12, 16, 68], "pip": [1, 19, 81, 82, 83, 88], "instal": [1, 9, 13, 27, 81, 82, 83, 88], "your": [1, 2, 10, 11, 12, 13, 14, 15, 16, 22, 23, 25, 27, 28, 30, 32, 33, 34, 36, 41, 43, 44, 45, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 61, 63, 64, 65, 66, 67, 68, 69, 70, 71, 74, 75, 76, 77, 78, 79, 80, 87], "run": [1, 2, 3, 10, 13, 28, 49, 52, 60, 65, 66, 69, 70, 84, 88], "script": [1, 87], "gen_md": 1, "py": [1, 8, 19, 83, 87, 88, 89], "automat": [1, 2, 3, 10, 11, 13, 18, 84, 88], "gener": [1, 2, 4, 5, 6, 9, 10, 11, 13, 14, 16, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 84, 86, 88], "For": [1, 2, 6, 7, 9, 11, 13, 14, 16, 17, 18, 19, 20, 22, 23, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 39, 49, 50, 51, 52, 53, 54, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 83, 87, 88], "add": [1, 3, 9, 10, 14, 16, 83, 84, 87, 88], "complet": [1, 11, 13, 16, 18, 19, 38, 51, 63, 64, 87, 89], "ensur": [1, 2, 3, 5, 7, 9, 16, 87, 88], "i": [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 83, 84, 87, 88, 89], "ha": [1, 2, 4, 6, 7, 9, 11, 13, 14, 15, 16, 18, 19, 48, 68, 82, 83, 84, 86, 87, 88, 89], "properli": [1, 4], "format": [1, 4, 9, 11, 13, 14, 16], "md": [1, 88], "correspond": [1, 2, 3, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 83, 84, 88], "gif": 1, "_static": 1, "video": [1, 11, 67], "env_typ": 1, "where": [1, 3, 5, 6, 7, 9, 11, 13, 14, 16, 18, 19, 41, 83, 84, 87, 88, 89], "categori": 1, "e": [1, 2, 4, 6, 7, 8, 10, 11, 13, 14, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 84, 87, 88], "g": [1, 2, 4, 6, 7, 8, 10, 11, 69, 84, 88], "mujoco": [1, 11, 16, 84], "snake_cas": 1, "name": [1, 3, 11, 88], "convent": [1, 2, 19], "altern": [1, 19, 84], "gen_gif": 1, "index": [1, 8, 9, 13, 14, 16, 19], "toctre": 1, "requir": [1, 2, 4, 14, 18, 83, 84, 87], "packag": [1, 13, 84], "r": [1, 6, 13, 15, 67], "txt": 1, "To": [1, 3, 8, 10, 13, 14, 15, 16, 18, 19, 27, 37, 64, 87, 88], "onc": [1, 13, 26, 36, 42, 49, 87, 88], "cd": [1, 88], "make": [1, 2, 5, 9, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 83, 86, 87], "dirhtml": 1, "_build": 1, "rebuild": [1, 27], "everi": [1, 9, 13, 16, 36, 37, 40, 45, 67, 68, 77, 84, 88], "time": [1, 2, 3, 5, 9, 10, 11, 18, 19, 35, 40, 41, 42, 46, 50, 52, 53, 60, 64, 65, 66, 67, 68, 69, 84, 87, 88], "chang": [1, 2, 8, 9, 10, 11, 13, 14, 15, 16, 17, 18, 19, 46, 54, 64, 83, 84, 87, 88], "made": 1, "sphinx": 1, "autobuild": 1, "b": [1, 6], "we": [1, 2, 6, 13, 14, 15, 16, 18, 19, 84, 87, 88, 89], "us": [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 83, 84, 85, 87, 89], "galleri": 1, "insid": [1, 5, 6, 13, 88], "directori": 1, "check": [1, 2, 6, 13, 87, 88], "demo": 1, "see": [1, 2, 4, 9, 10, 16, 18, 19, 20, 23, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 39, 49, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 84, 87, 88], "exampl": [1, 2, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 84, 87, 88, 89], "more": [1, 2, 4, 5, 6, 9, 10, 11, 14, 18, 19, 20, 23, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 39, 44, 49, 50, 51, 52, 53, 54, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 83, 84, 87, 88, 89], "inform": [1, 2, 4, 5, 6, 9, 10, 11, 13, 14, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 84, 87, 88, 89], "convert": [1, 3, 4, 5, 11, 13, 14, 17, 84, 87], "jupyer": 1, "notebook": [1, 87, 88, 89], "can": [1, 2, 3, 4, 5, 6, 9, 10, 11, 12, 13, 14, 15, 16, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 87, 88], "want": [1, 2, 5, 10, 11, 12, 13, 15, 16, 28, 49, 88], "execut": [1, 9, 12, 19, 41, 84, 88], "which": [1, 2, 3, 4, 5, 7, 8, 9, 10, 11, 13, 14, 15, 16, 17, 18, 19, 38, 40, 42, 56, 83, 84, 88, 89], "output": [1, 8, 9, 13, 16, 87], "plot": [1, 9, 87], "should": [1, 2, 4, 6, 9, 10, 13, 14, 16, 18, 87, 88], "start": [1, 2, 4, 6, 9, 10, 13, 29, 41, 42, 48, 52, 53, 68, 84, 87], "run_": 1, "note": [1, 4, 8, 13, 87, 89], "so": [1, 9, 10, 11, 13, 14, 16, 19, 46, 69, 82, 84, 87, 88, 89], "sure": [1, 2, 13, 88], "doesn": [1, 2, 3, 11, 13, 19, 87, 89], "t": [1, 2, 3, 5, 6, 7, 9, 11, 13, 14, 15, 18, 19, 35, 44, 45, 46, 47, 48, 67, 68, 87, 88, 89], "take": [1, 2, 3, 6, 7, 9, 10, 11, 12, 13, 16, 19, 71, 82, 84, 87], "than": [1, 18, 44, 50, 68, 84, 87], "few": 1, "second": [1, 5, 9, 10, 18, 32, 62, 69, 84], "class": [2, 4, 5, 6, 9, 10, 11, 12, 13, 14, 15, 16, 83, 87, 88], "The": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 86, 87, 88, 89], "main": 2, "reinforc": [2, 4, 16, 85, 87, 89], "learn": [2, 4, 5, 13, 14, 15, 16, 19, 44, 45, 46, 47, 48, 85, 88], "agent": [2, 4, 11, 13, 14, 16, 18, 19, 42, 51, 88, 89], "encapsul": 2, "an": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 84, 88, 89], "arbitrari": [2, 3, 6, 9, 14, 15, 84], "behind": [2, 62], "scene": [2, 62, 84], "dynam": [2, 19, 34, 44, 45, 46, 47, 48, 83, 84], "through": [2, 3, 4, 10, 18, 19, 34, 49, 52, 55, 56, 60, 69, 70, 84, 89], "step": [2, 3, 10, 11, 12, 13, 14, 15, 16, 19, 84, 86, 87, 88, 89], "reset": [2, 3, 9, 10, 11, 12, 13, 14, 15, 16, 84, 86, 87, 88], "function": [2, 3, 4, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 84, 86, 87, 89], "partial": 2, "fulli": [2, 84], "observ": [2, 4, 5, 8, 9, 10, 11, 12, 13, 15, 18, 84, 86, 88, 89], "singl": [2, 4, 5, 6, 7, 8, 9, 10, 14, 16, 88], "multi": [2, 6, 83], "pettingzoo": 2, "api": [2, 11, 13, 16, 18, 84, 88, 89], "user": [2, 3, 10, 16, 18, 19, 84, 86, 88], "need": [2, 3, 4, 5, 9, 11, 12, 13, 14, 16, 18, 37, 38, 43, 49, 53, 63, 68, 83, 87, 88, 89], "know": [2, 13, 16, 88], "updat": [2, 9, 13, 14, 16, 17, 18, 87, 88, 89], "action": [2, 3, 4, 5, 6, 9, 10, 11, 13, 18, 82, 84, 85, 86, 88], "return": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 84, 87, 88, 89], "next": [2, 8, 16, 18, 38, 40, 42], "reward": [2, 3, 9, 10, 11, 13, 16, 18, 83, 84, 86, 87, 88, 89], "termin": [2, 3, 9, 10, 11, 13, 15, 16, 17, 18, 86, 87, 88], "truncat": [2, 3, 9, 10, 11, 13, 15, 16, 17, 18, 86, 87, 88], "due": [2, 18, 89], "latest": 2, "from": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 18, 19, 21, 35, 41, 46, 47, 50, 52, 61, 62, 74, 80, 83, 84, 87, 88, 89], "about": [2, 9, 14, 16, 63, 87, 88, 89], "metric": [2, 9, 18], "debug": [2, 4, 9, 85], "info": [2, 9, 10, 11, 14, 15, 16, 18, 86, 87, 88, 89], "initi": [2, 3, 5, 6, 10, 11, 12, 13, 14, 15, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 82, 83, 84, 87], "state": [2, 11, 13, 14, 16, 18, 19, 82, 83, 84, 85, 87, 88, 89], "befor": [2, 3, 9, 10, 11, 12, 13, 14, 15, 18, 27, 38, 52, 63, 70, 71, 88], "call": [2, 3, 7, 9, 10, 11, 12, 13, 14, 16, 18, 19, 32, 50, 87, 88], "first": [2, 9, 10, 11, 13, 14, 16, 18, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 83, 84, 87, 88], "episod": [2, 3, 9, 11, 14, 18, 87, 88, 89], "render": [2, 10, 11, 14, 16, 19, 81, 84, 87, 88], "help": [2, 4, 16, 22, 53, 56, 84, 87], "visualis": [2, 16], "what": [2, 4, 13, 19], "mode": [2, 10, 11, 13, 16, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 88], "human": [2, 5, 11, 16, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 84, 86, 88], "rgb_arrai": [2, 9, 11, 13, 14, 19, 88], "ansi": [2, 88], "text": [2, 4, 5, 7, 16, 84], "close": [2, 6, 9, 10, 11, 16, 18, 38, 63, 86, 87, 88], "import": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 86, 88], "when": [2, 4, 5, 7, 8, 9, 10, 11, 13, 14, 15, 19, 22, 35, 38, 39, 40, 42, 44, 45, 46, 47, 48, 50, 51, 65, 66, 67, 68, 71, 88, 89], "extern": [2, 18, 89], "softwar": [2, 84], "pygam": [2, 9, 18, 81, 84, 88], "databas": 2, "have": [2, 3, 6, 7, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 22, 25, 27, 28, 32, 34, 36, 37, 38, 39, 44, 45, 46, 47, 48, 49, 52, 53, 54, 58, 60, 62, 68, 70, 81, 84, 87, 88, 89], "understand": [2, 7, 10, 84], "action_spac": [2, 9, 10, 11, 12, 14, 15, 16, 18, 87, 88], "space": [2, 9, 10, 11, 12, 13, 14, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 83, 84, 85, 88], "object": [2, 4, 8, 11, 16, 20, 25, 38, 44, 45, 53, 65, 71, 84, 87], "valid": [2, 3, 4, 6, 8, 10, 11, 12, 13, 16, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 87], "all": [2, 5, 6, 10, 11, 13, 16, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 45, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 87], "within": [2, 4, 12, 14, 16, 17, 18, 56, 60, 82, 84], "observation_spac": [2, 5, 6, 10, 11, 14, 16, 88], "reward_rang": [2, 11, 15], "A": [2, 4, 5, 6, 7, 9, 10, 12, 13, 14, 15, 17, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 87, 88, 89], "tupl": [2, 4, 6, 7, 8, 9, 11, 14, 16, 18, 19, 87, 88], "minimum": [2, 6], "maximum": [2, 3, 6, 9, 13, 16, 67, 68, 84, 88], "possibl": [2, 5, 6, 7, 16, 17, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 84, 87, 88], "over": [2, 8, 13, 15, 22, 28, 50, 60, 65, 87], "default": [2, 3, 4, 5, 6, 9, 10, 11, 13, 14, 16, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 84, 88, 89], "rang": [2, 8, 9, 11, 12, 13, 15, 16, 17, 18, 19, 50, 82, 86, 87, 88], "set": [2, 5, 6, 10, 11, 12, 13, 14, 18, 19, 20, 21, 22, 23, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 76, 77, 78, 79, 81, 82, 83, 84, 87, 88, 89], "infti": [2, 6], "spec": [2, 10, 11, 13], "metadata": [2, 9, 11, 13, 19, 88], "fp": [2, 9, 19, 88], "np_random": [2, 9, 11, 13, 18, 88], "random": [2, 4, 5, 6, 9, 13, 14, 16, 19, 84, 87, 88], "number": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 13, 14, 16, 17, 19, 21, 22, 23, 24, 25, 26, 27, 30, 31, 32, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 52, 55, 57, 58, 59, 61, 62, 64, 67, 69, 71, 72, 74, 75, 76, 78, 79, 88], "assign": [2, 69], "dure": [2, 5, 6, 10, 11, 13, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 88], "super": [2, 11, 12, 14, 15, 18, 88], "seed": [2, 3, 4, 5, 6, 10, 16, 66, 86, 88], "assess": 2, "self": [2, 4, 5, 11, 12, 13, 14, 15, 84, 87, 88], "modifi": [2, 4, 10, 11, 12, 14, 15, 18, 84, 88], "extend": [2, 84], "wrapper": [2, 3, 5, 6, 9, 10, 16, 17, 18, 84, 86], "acttyp": [2, 9, 11], "obstyp": [2, 9, 11, 18], "float": [2, 3, 7, 9, 11, 12, 14, 15, 19, 49, 62, 84, 87, 88], "bool": [2, 3, 4, 6, 9, 10, 11, 13, 14, 18, 19, 88], "dict": [2, 4, 6, 7, 8, 9, 10, 11, 13, 14, 16, 18, 88], "one": [2, 5, 6, 7, 9, 10, 11, 13, 14, 16, 21, 22, 23, 27, 32, 38, 41, 42, 54, 63, 64, 65, 67, 68, 73, 84, 87, 89], "timestep": [2, 13, 14, 16, 88], "end": [2, 11, 13, 16, 27, 36, 37, 38, 40, 42, 43, 51, 52, 53, 63, 67, 70, 71, 84, 87, 89], "reach": [2, 11, 27, 29, 38, 41, 42, 59, 62, 70, 71, 82, 84, 88, 89], "necessari": [2, 4, 19, 44, 45, 46, 47, 48], "version": [2, 3, 4, 11, 84, 87, 88, 89], "0": [2, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 84, 87, 88, 89], "26": [2, 17, 88, 89], "wa": [2, 9, 10, 11, 14, 15, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 84, 87, 89], "remov": [2, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80], "done": [2, 3, 9, 11, 13, 16, 17, 18, 87, 88, 89], "favor": 2, "clearer": 2, "had": 2, "critic": [2, 13], "bootstrap": [2, 18, 89], "algorithm": [2, 4, 83, 85, 87, 89], "paramet": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 83, 88], "provid": [2, 4, 5, 6, 9, 10, 11, 12, 13, 14, 16, 17, 19, 25, 38, 40, 44, 45, 46, 47, 48, 84, 88], "element": [2, 4, 5, 6, 8, 10, 14, 16, 83, 88], "numpi": [2, 4, 6, 8, 10, 11, 12, 14, 18, 84, 87, 88], "arrai": [2, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 84, 88], "posit": [2, 5, 6, 7, 8, 9, 13, 14, 16, 19, 30, 50, 83, 84, 87, 88], "veloc": [2, 5, 7, 8, 83], "pole": [2, 69, 84], "cartpol": [2, 3, 9, 10, 13, 14, 15, 16, 82, 84], "result": [2, 7, 9, 10, 16, 84, 85], "whether": [2, 3, 6, 9, 13, 32, 87, 88, 89], "defin": [2, 4, 7, 11, 12, 13, 14, 15, 16, 86, 88, 89], "under": [2, 14, 15, 84, 87], "mdp": [2, 13, 16], "task": [2, 5, 11, 14, 16, 54, 60, 63, 88, 89], "neg": [2, 6, 9, 16, 69], "goal": [2, 22, 25, 30, 32, 34, 36, 38, 50, 55, 56, 57, 58, 59, 61, 64, 66, 68, 69, 75, 76, 77, 78, 79, 80, 84, 88], "move": [2, 11, 15, 16, 18, 21, 24, 25, 34, 35, 48, 51, 62, 65, 68, 69, 84, 88, 89], "lava": [2, 16, 49], "sutton": [2, 87], "barton": 2, "gridworld": [2, 88], "true": [2, 3, 7, 9, 10, 12, 13, 14, 16, 17, 19, 44, 45, 46, 47, 48, 87, 88], "condit": [2, 87, 89], "outsid": [2, 89], "scope": [2, 89], "satisfi": 2, "typic": [2, 9, 84], "timelimit": [2, 3, 11, 13, 16, 88, 89], "could": [2, 9, 14, 15, 16, 19, 84, 88, 89], "also": [2, 3, 6, 9, 10, 11, 13, 14, 16, 17, 19, 31, 51, 52, 63, 64, 66, 82, 83, 84, 87, 88, 89], "indic": [2, 9, 13, 18, 87, 89], "physic": [2, 81, 83, 84], "go": [2, 42, 69, 73, 87, 89], "out": [2, 8, 19, 28, 33, 49, 52, 60, 65, 70, 87, 88, 89], "bound": [2, 6, 11, 12, 16, 18, 89], "prematur": 2, "auxiliari": [2, 88], "diagnost": 2, "log": 2, "might": [2, 4, 6, 7, 11, 12, 13, 14, 15, 18, 84, 87, 88], "instanc": [2, 3, 4, 5, 7, 8, 9, 10, 11, 13, 15, 16, 17, 84], "describ": [2, 5, 16, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 84], "perform": [2, 9, 13, 16, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 84], "variabl": [2, 4, 6, 10, 13, 18, 84, 87, 88, 89], "hidden": [2, 83, 84], "individu": [2, 11, 88], "term": [2, 11, 82, 83, 87, 88], "combin": [2, 4, 9, 11, 16, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 49, 50, 51, 52, 53, 54, 55, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79], "produc": [2, 11, 13, 88], "total": [2, 38], "In": [2, 6, 9, 10, 11, 12, 14, 16, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 82, 84, 87, 88, 89], "openai": [2, 3, 10, 11, 16, 18, 81, 86, 87, 89], "gym": [2, 3, 4, 5, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 18, 81, 86, 87, 88, 89], "v26": 2, "distinguish": [2, 88, 89], "howev": [2, 3, 4, 5, 6, 7, 10, 11, 12, 13, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 88, 89], "deprec": 2, "favour": [2, 18], "boolean": [2, 4, 9, 13, 18, 87], "valu": [2, 3, 4, 5, 6, 7, 8, 9, 11, 12, 13, 14, 16, 18, 19, 68, 83, 87, 89], "case": [2, 4, 5, 6, 11, 12, 14, 16, 18, 51, 63, 88, 89], "further": [2, 68], "undefin": 2, "signal": [2, 11, 13, 16, 88, 89], "mai": [2, 6, 9, 10, 12, 13, 14, 16, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 88], "emit": [2, 11, 13], "differ": [2, 4, 5, 9, 10, 11, 12, 13, 14, 16, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 84, 87, 88, 89], "reason": [2, 18, 84], "mayb": 2, "underli": [2, 11, 13, 16], "solv": [2, 82, 83, 88], "successfulli": 2, "certain": [2, 41, 43, 87], "exceed": [2, 11, 13, 16, 87], "simul": [2, 19, 44, 45, 46, 47, 48, 83, 84, 87], "enter": [2, 9, 26, 28, 54], "invalid": [2, 6, 87], "option": [2, 3, 4, 5, 6, 9, 10, 11, 13, 14, 16, 18, 87, 88], "int": [2, 3, 4, 5, 6, 7, 8, 9, 10, 12, 13, 14, 19, 87, 88], "none": [2, 3, 4, 5, 6, 7, 8, 9, 10, 13, 14, 87, 88], "intern": [2, 10, 14], "new": [2, 4, 11, 12, 13, 14, 16, 17, 18, 23, 26, 28, 40, 84, 87, 88, 89], "often": [2, 4, 18, 83, 88], "some": [2, 4, 5, 6, 10, 11, 13, 14, 15, 16, 18, 19, 35, 42, 60, 82, 83, 84, 87, 88], "explor": [2, 4, 48, 87], "generalis": 2, "polici": [2, 14, 15, 16, 18, 82, 83, 84, 86, 87, 89], "control": [2, 4, 6, 15, 16, 18, 19, 21, 24, 26, 27, 28, 29, 30, 35, 37, 39, 46, 47, 48, 51, 53, 60, 61, 63, 65, 66, 67, 68, 69, 70, 73, 74, 81], "alreadi": [2, 11, 14, 16, 84], "rng": [2, 4, 5, 6, 88], "therefor": [2, 4, 10, 17, 18], "right": [2, 6, 19, 21, 23, 24, 25, 26, 30, 34, 35, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 50, 51, 52, 53, 55, 57, 58, 59, 61, 64, 69, 71, 72, 74, 75, 78, 79, 87, 88], "after": [2, 3, 9, 10, 13, 14, 16, 27, 31, 36, 41, 45, 49, 71, 84, 87, 88, 89], "never": 2, "again": [2, 88], "custom": [2, 4, 9, 10, 14, 16, 18, 19, 44, 45, 46, 47, 48, 84], "line": [2, 18, 41, 88], "correctli": [2, 14, 15, 88], "v0": [2, 3, 10, 11, 13, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 88, 89], "25": [2, 19, 44, 45, 46, 47, 48], "return_info": 2, "now": [2, 18, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 87, 88, 89], "expect": [2, 4, 5, 6, 10, 13, 16], "prng": [2, 4, 5, 6], "doe": [2, 3, 5, 7, 9, 10, 11, 13, 17, 31, 46, 88, 89], "pass": [2, 3, 4, 5, 6, 7, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 88], "chosen": [2, 6, 19], "sourc": [2, 83, 84, 87, 88, 89], "entropi": 2, "timestamp": 2, "dev": 2, "urandom": 2, "integ": [2, 5, 6, 9, 13, 14, 18, 19, 88], "even": [2, 3, 20, 22, 28, 29, 31, 33, 36, 37, 39, 49, 50, 51, 53, 54, 56, 60, 63, 65, 66, 67, 68, 70, 73, 77, 80, 87, 88], "exist": [2, 3, 4, 10, 11, 16], "usual": [2, 5, 6, 11, 13, 19, 44, 45, 46, 47, 48, 50, 87, 88], "been": [2, 9, 13, 16, 18, 84, 88, 89], "refer": [2, 9, 13, 16, 18, 88, 89], "minim": [2, 88, 89], "abov": [2, 5, 6, 9, 18, 19, 44, 45, 46, 47, 48, 83], "paradigm": 2, "specifi": [2, 4, 5, 6, 9, 11, 12, 13, 14, 15, 16, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 84, 85, 88], "how": [2, 4, 9, 10, 16, 50, 52, 53, 84, 87, 88, 89], "depend": [2, 5, 9, 14, 15, 19, 21, 22, 23, 24, 25, 26, 27, 30, 31, 32, 34, 35, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 52, 53, 55, 57, 58, 59, 61, 62, 64, 69, 71, 72, 74, 75, 76, 78, 79, 81, 82, 83, 84], "specif": [2, 3, 6, 13, 84, 89], "analog": [2, 19], "dictionari": [2, 4, 5, 9, 10, 11, 13, 14, 16, 87, 88], "complement": 2, "It": [2, 3, 5, 6, 9, 10, 11, 13, 16, 19, 20, 21, 22, 23, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 49, 50, 51, 52, 53, 54, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 76, 77, 78, 79, 83, 84, 87, 88], "union": [2, 3, 4, 5, 6, 7, 8, 9, 10, 12, 14], "renderfram": [2, 9], "list": [2, 4, 5, 6, 9, 10, 11, 14, 16, 19, 84, 87], "comput": [2, 9, 18, 61, 73, 84, 88], "frame": [2, 9, 13, 14, 19, 32, 84], "render_mod": [2, 9, 10, 11, 13, 14, 16, 18, 19, 86, 88], "wai": [2, 5, 11, 16, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 84, 87, 89], "most": [2, 4, 11, 13, 14, 16, 18, 19, 44, 45, 46, 47, 48, 87, 88], "achiev": [2, 19, 22], "appli": [2, 3, 5, 7, 8, 9, 10, 11, 12, 13, 14, 15, 17, 82, 84, 87, 88], "collect": [2, 10, 22, 25, 42, 56, 57, 60, 76, 84, 87], "As": [2, 10, 11, 16, 74, 83, 84, 85], "known": [2, 13, 26, 84], "__init__": [2, 5, 8, 11, 12, 14, 15, 87, 88], "initialis": [2, 13, 18], "By": [2, 3, 13, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80], "continu": [2, 4, 11, 12, 16, 24, 25, 82, 84, 87, 89], "current": [2, 6, 9, 11, 13, 14, 19, 87, 88], "displai": [2, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 84, 88], "consumpt": 2, "occur": [2, 13, 88], "repres": [2, 5, 6, 9, 16, 18, 86, 88], "np": [2, 4, 5, 6, 8, 9, 10, 12, 13, 14, 15, 87, 88], "ndarrai": [2, 3, 5, 6, 7, 8, 9, 12], "shape": [2, 4, 5, 6, 7, 8, 11, 12, 13, 14, 16, 88], "x": [2, 4, 6, 7, 84, 87, 88], "y": [2, 6, 19, 87], "3": [2, 5, 6, 7, 8, 9, 10, 13, 14, 17, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 84, 87, 88], "rgb": [2, 11, 13, 14, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80], "pixel": [2, 11, 84, 88], "imag": [2, 4, 10, 11, 13, 14, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 84], "string": [2, 4, 6, 9, 14], "str": [2, 3, 4, 5, 6, 7, 9, 10, 13, 14, 18, 19], "stringio": [2, 85], "style": [2, 10, 13, 84], "represent": [2, 16, 89], "each": [2, 3, 4, 5, 6, 9, 10, 11, 12, 14, 16, 19, 38, 40, 41, 42, 43, 46, 54, 61, 63, 64, 65, 66, 67, 68, 69, 81, 82, 84, 85, 87, 88], "includ": [2, 3, 14, 16, 17, 18, 19, 84, 88, 89], "newlin": 2, "escap": [2, 52, 56], "sequenc": [2, 3, 4, 6, 7, 10, 14, 16, 19, 84], "color": [2, 5, 23, 34, 46, 64], "rgb_array_list": [2, 9, 11, 13], "ansi_list": 2, "base": [2, 4, 5, 10, 11, 12, 13, 14, 15, 16, 42, 51, 68, 81, 83, 84, 87, 88], "except": [2, 65, 68, 88], "rendercollect": [2, 11, 13], "pop": 2, "kei": [2, 3, 4, 5, 6, 9, 10, 11, 13, 14, 16, 19, 20, 50, 84, 87, 88, 89], "support": [2, 4, 5, 7, 9, 10, 11, 13, 14, 16, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 84, 88], "longer": [2, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 84], "accept": [2, 9, 13, 19, 88], "rather": [2, 18, 84, 87], "v1": [2, 3, 9, 10, 13, 14, 15, 16, 87], "type": [2, 4, 5, 6, 10, 11, 12, 14, 16, 18, 40, 84, 88], "discret": [2, 4, 5, 7, 8, 10, 12, 14, 16, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 84, 85, 87, 88], "give": [2, 22, 23, 40, 41, 87], "2": [2, 5, 6, 7, 8, 9, 10, 12, 14, 15, 19, 20, 21, 23, 24, 25, 26, 27, 29, 30, 32, 34, 35, 37, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 50, 52, 55, 57, 58, 59, 61, 62, 64, 69, 71, 72, 73, 74, 75, 76, 78, 79, 84, 87, 88], "mean": [2, 16, 18, 88], "two": [2, 5, 6, 9, 10, 13, 18, 19, 21, 32, 73, 83, 88], "1": [2, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 87, 88, 89], "box": [2, 4, 5, 7, 8, 10, 11, 12, 14, 16, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 84, 88], "4028234663852886e": 2, "38": 2, "4": [2, 6, 7, 9, 10, 11, 12, 13, 14, 16, 19, 21, 23, 24, 25, 26, 28, 30, 32, 34, 35, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 52, 55, 57, 58, 59, 61, 62, 63, 64, 71, 72, 74, 75, 76, 78, 79, 87, 88], "float32": [2, 5, 6, 7, 8, 10, 11, 12, 14, 16], "denot": 2, "well": [2, 4, 26, 68, 84, 88], "high": [2, 5, 6, 7, 8, 10, 14, 16, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 84], "8000002e": 2, "00": 2, "4028235e": 2, "1887903e": 2, "01": [2, 15], "dtype": [2, 4, 5, 6, 8, 10, 14, 88], "low": [2, 5, 6, 7, 8, 14, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 84], "ani": [2, 4, 5, 8, 9, 13, 14, 17, 18, 19, 40, 44, 45, 46, 47, 48, 49, 67, 87, 88, 89], "etc": [2, 4, 11, 63, 66, 70, 88, 89], "determin": [2, 6, 19, 84, 88, 89], "inf": [2, 14], "envspec": [2, 3], "normal": [2, 6, 11, 13], "finish": 2, "code": [2, 4, 5, 9, 10, 11, 13, 14, 15, 84, 87, 88], "clean": 2, "up": [2, 5, 6, 10, 14, 19, 20, 22, 23, 24, 25, 26, 28, 29, 30, 32, 35, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 51, 52, 55, 57, 62, 64, 65, 66, 68, 69, 72, 73, 74, 75, 78, 79, 83, 87, 88], "window": [2, 9, 38, 84, 88], "http": [2, 9, 11, 19, 84, 88], "connect": [2, 5], "properti": [2, 4, 11, 89], "unwrap": [2, 11, 16], "non": [2, 4, 7, 9, 88, 89], "wrap": [2, 3, 9, 10, 11, 12, 13, 14, 15, 16, 88], "_np_random": 2, "meth": 2, "much": [2, 19, 44, 45, 46, 47, 48, 52, 53, 88, 89], "creat": [2, 3, 6, 8, 9, 10, 13, 16, 29, 84, 85, 87], "creation": [2, 10, 88], "tutori": [2, 16, 18, 87], "gymnasium": [3, 4, 5, 6, 7, 8, 9, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 89], "allow": [3, 4, 5, 9, 11, 12, 14, 15, 16, 18, 19, 49, 67, 88], "load": 3, "pre": [3, 18], "sever": [3, 6, 11, 13, 16, 18, 19, 48, 84], "id": [3, 10, 88], "kwarg": [3, 9, 10, 11, 88], "env": [3, 9, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 86, 87, 89], "liter": 3, "mountaincar": 3, "mountaincarcontinu": 3, "supportsfloat": [3, 6, 11, 18], "pendulum": [3, 10, 14, 16, 82], "acrobot": [3, 82, 84], "lunarland": [3, 13, 16, 18, 84, 86], "v2": [3, 12, 13, 16, 18, 86], "lunarlandercontinu": [3, 12], "bipedalwalk": [3, 11, 12, 16], "v3": [3, 11, 12, 16, 83], "bipedalwalkerhardcor": 3, "carrac": [3, 9, 14], "blackjack": [3, 16], "frozenlak": [3, 9], "frozenlake8x8": 3, "cliffwalk": 3, "taxi": 3, "reacher": [3, 11, 83], "v4": [3, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80], "pusher": 3, "invertedpendulum": [3, 83], "inverteddoublependulum": 3, "halfcheetah": [3, 83], "hopper": [3, 83], "swimmer": [3, 83], "walker2d": 3, "ant": [3, 83], "humanoidstandup": [3, 83], "humanoid": [3, 39, 83], "accord": [3, 5, 6, 10], "given": [3, 6, 11, 14, 65, 68, 82, 89], "find": [3, 19, 20, 44, 45, 46, 47, 48, 54, 63, 75, 84, 88], "avail": [3, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 84, 88], "modul": [3, 8, 88], "eg": [3, 9, 84, 88], "max_episode_step": [3, 13, 88], "length": [3, 5, 6, 9, 11, 13, 14, 84], "autoreset": [3, 10, 88], "autoresetwrapp": [3, 11, 13, 88], "apply_api_compat": [3, 13, 17], "stepapicompat": [3, 11, 13, 17], "argument": [3, 4, 5, 6, 7, 9, 10, 14, 16, 81, 82, 85, 88], "fals": [3, 9, 10, 13, 14, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 87, 88], "disable_env_check": [3, 10], "checker": [3, 10], "addit": [3, 4, 10, 11, 13, 16, 18, 19, 25, 36, 65, 69, 82, 84, 87, 88], "constructor": [3, 4, 5, 6, 9, 11, 16, 88], "rais": [3, 6, 7, 8, 9, 10, 13, 14], "error": [3, 6, 9, 11, 13, 89], "entry_point": [3, 88], "callabl": [3, 8, 9, 10, 13, 14, 15], "reward_threshold": [3, 88], "nondeterminist": [3, 88], "order_enforc": [3, 88], "syntax": 3, "namespac": [3, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 88], "env_nam": [3, 17], "v": [3, 6, 67, 87], "keyword": [3, 5, 10, 14, 16, 17, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 88], "entri": 3, "point": [3, 7, 9, 11, 19, 22, 23, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 45, 49, 50, 53, 60, 61, 62, 63, 64, 65, 66, 68, 70, 71, 72, 74, 75, 78, 84, 89], "threshold": [3, 88], "consid": [3, 14, 82, 83, 84, 88], "learnt": 3, "knowledg": 3, "limit": [3, 16, 35, 42, 49, 50, 63, 68], "enabl": [3, 11, 19, 84], "order": [3, 4, 5, 11, 16, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 83, 84, 88], "enforc": 3, "correct": [3, 88, 89], "disabl": [3, 13], "recommend": [3, 10, 13, 18, 19, 44, 45, 46, 47, 48, 84, 87, 88], "onli": [3, 4, 5, 6, 7, 10, 11, 12, 13, 14, 19, 21, 23, 24, 25, 26, 27, 30, 32, 34, 35, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 50, 52, 55, 57, 58, 59, 61, 62, 64, 65, 66, 67, 68, 69, 71, 72, 74, 75, 76, 78, 79, 84, 87, 88], "env_id": 3, "retriev": [3, 13, 39, 42, 68], "global": 3, "superclass": [4, 12, 14, 15], "crucial": 4, "thei": [4, 10, 13, 14, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 85, 88], "serv": 4, "variou": [4, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 84], "purpos": [4, 84], "clearli": 4, "interact": [4, 9, 19, 84, 87, 88], "environ": [4, 6, 8, 11, 12, 14, 15, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 85, 89], "look": [4, 9, 11, 13, 15, 16, 19, 21, 23, 24, 25, 26, 27, 30, 32, 34, 35, 38, 40, 41, 42, 43, 52, 55, 57, 58, 59, 61, 62, 64, 67, 69, 71, 72, 74, 75, 76, 78, 79, 88, 89], "like": [4, 6, 9, 11, 12, 13, 14, 15, 16, 21, 22, 23, 24, 25, 26, 27, 28, 30, 32, 34, 35, 38, 40, 41, 42, 43, 52, 55, 57, 58, 59, 60, 61, 62, 63, 64, 69, 71, 72, 74, 75, 76, 78, 79, 84, 88], "u": [4, 6, 11, 15, 19, 84, 85, 87, 88], "work": [4, 9, 11, 13, 14, 19, 84, 87], "highli": [4, 18, 19, 81, 82, 88], "structur": [4, 5, 7, 84, 88], "data": [4, 7, 9, 11, 18, 87, 88], "form": [4, 5, 6, 13, 88], "painlessli": 4, "transform": [4, 7, 9, 11, 12, 13], "them": [4, 11, 13, 19, 21, 22, 23, 26, 27, 31, 35, 41, 62, 71, 84], "flat": [4, 5, 6, 7, 14], "sampl": [4, 5, 6, 7, 8, 9, 10, 14, 15, 16, 18, 87, 88], "especi": [4, 15, 88], "hierarch": 4, "via": [4, 5, 11, 13, 14, 15, 16, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 88], "build": [4, 11, 21, 38, 42, 84], "express": [4, 9], "inherit": [4, 11, 12, 14, 15, 16, 88], "cover": [4, 87], "parametr": 4, "probabl": [4, 19, 87, 89], "distribut": [4, 5, 6], "batch": [4, 8, 10], "vectorenv": 4, "moreov": [4, 13, 19, 22, 32, 88], "implement": [4, 5, 10, 12, 13, 14, 15, 16, 17, 18, 19, 84, 85, 88], "handl": [4, 10, 87], "care": [4, 69], "immut": 4, "mask": [4, 5, 6, 18, 84], "t_cov": 4, "randomli": [4, 5, 88], "uniform": [4, 6], "bounded": 4, "int8": [4, 6], "member": [4, 52], "possibli": [4, 5, 6, 8, 11, 13, 16, 84], "subspac": [4, 5, 6, 7], "to_json": 4, "sample_n": 4, "jsonabl": 4, "from_json": 4, "complex": [4, 5, 84, 87], "matric": 4, "multidiscret": [4, 5, 7, 8, 10, 16, 88], "binari": [4, 6, 16, 88], "hold": [4, 87], "down": [4, 6, 19, 23, 25, 26, 32, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 51, 52, 55, 57, 59, 60, 62, 64, 72, 74, 75, 78, 79, 87, 88, 89], "button": [4, 6, 9, 16], "multibinari": [4, 5, 7, 8, 16], "multipl": [4, 5, 6, 8, 10, 84], "ax": [4, 6, 88], "messag": [4, 84], "mission": [4, 51, 53, 54], "detail": [4, 9, 13, 16, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 84, 88], "join": 4, "togeth": [4, 19, 83], "vectoris": 4, "separ": [4, 5, 18, 88], "readabl": [4, 5], "fix": [4, 5, 6, 11, 13, 15, 16, 18, 51, 83, 88], "unord": 4, "entiti": 4, "select": [4, 6, 41, 84], "graph": [4, 7, 16], "node": [4, 5, 7], "edg": [4, 5, 7], "flatten": [4, 7, 11, 83, 88], "unflatten": [4, 7], "neural": [4, 7, 84], "network": [4, 7, 84], "flatdim": [4, 7], "dimens": [4, 6, 7, 14, 84], "flatten_spac": [4, 7], "revers": [4, 7], "size": [4, 13, 88], "batch_spac": [4, 8], "concaten": [4, 7, 8, 83], "iter": [4, 5, 8, 10], "create_empty_arrai": [4, 8], "create_shared_memori": [4, 8], "read_from_shared_memori": [4, 8], "write_to_shared_memori": [4, 8], "spaces_kwarg": 5, "constitu": 5, "usag": [5, 6, 7, 11], "ordereddict": [5, 8, 14], "nest": [5, 8, 84], "ext_control": 5, "5": [5, 6, 7, 8, 12, 13, 19, 21, 23, 24, 25, 26, 29, 30, 32, 35, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 52, 55, 57, 58, 59, 61, 62, 64, 71, 72, 74, 75, 76, 78, 79, 84, 87, 88], "inner_st": 5, "charg": 5, "100": [5, 7, 13, 33, 42, 65, 66, 84], "system_check": 5, "10": [5, 6, 12, 19, 26, 32, 44, 45, 46, 47, 48, 55, 62, 65, 68, 84, 88], "job_statu": 5, "progress": [5, 74], "conveni": [5, 11, 16, 88], "easili": [5, 11, 84], "flattenobserv": [5, 11, 14, 88], "similar": [5, 18, 23, 34, 88], "deal": 5, "instanti": [5, 9, 13, 14, 15, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 88], "either": [5, 6, 7, 9, 13, 16, 19, 41, 51], "avoid": [5, 8, 11, 16, 19, 22, 23, 25, 30, 31, 38, 40, 56, 57, 59, 64, 66, 67, 72], "independ": [5, 6, 10], "same": [5, 7, 9, 10, 14, 50, 89], "attr": 5, "warn": [5, 9, 10, 13], "guarante": [5, 19], "uniqu": [5, 81, 82, 83], "sub": [5, 10, 68], "precis": 5, "cartesian": [5, 6], "product": [5, 6], "03633198": 5, "42370757": 5, "involv": [5, 81, 84, 88], "reproduc": 5, "method": [5, 9, 12, 13, 14, 15, 17, 84, 88], "draw": [5, 87, 88], "42": [5, 6, 86], "54": 5, "finit": [5, 6, 12, 89], "a_0": 5, "dot": [5, 6, 88], "a_n": 5, "a_i": 5, "belong": [5, 8, 84], "n": [5, 6, 7, 8, 16, 19, 84, 87], "0259352": 5, "80977976": 5, "80066574": 5, "77165383": 5, "must": [5, 7, 8, 9, 10, 11, 12, 13, 14, 16, 18, 19, 20, 21, 24, 26, 27, 28, 29, 31, 35, 36, 37, 39, 42, 43, 52, 56, 58, 59, 64, 84, 88, 89], "length_mask": 5, "sample_mask": 5, "drawn": [5, 6], "geometr": 5, "featur": [5, 6, 84], "feature_spac": 5, "node_spac": [5, 7], "edge_spac": [5, 7], "seri": [5, 16], "adjac": 5, "matrix": 5, "edge_link": [5, 7], "num_nod": 5, "num_edg": 5, "graphinst": [5, 7], "between": [5, 6, 13, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 84, 88, 89], "don": [5, 11, 18, 19, 35, 44, 45, 46, 47, 48, 68, 87, 88, 89], "edge_mask": 5, "multipli": 5, "attribut": [5, 16, 88], "_gener": 6, "unbound": 6, "mathbb": 6, "interv": [6, 16], "There": [6, 11, 16, 50, 51, 63, 82, 83, 84, 88], "common": [6, 11, 14, 16, 89], "ident": [6, 10, 14], "lower": [6, 16], "upper": [6, 16], "construct": [6, 19, 44, 45, 46, 47, 48, 88], "scalar": [6, 12], "respect": [6, 10, 11, 13, 16, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80], "assum": [6, 14, 88], "across": [6, 8, 25, 35, 45, 46, 49], "infer": [6, 83], "essenti": 6, "valueerror": [6, 7, 8, 10, 13, 14], "coordin": [6, 11, 14, 84], "shift": [6, 16], "exponenti": [6, 11, 15], "unsupport": 6, "is_bound": 6, "manner": [6, 11, 14, 50], "both": [6, 10, 13, 14, 16, 17, 82, 84, 88, 89], "sens": [6, 84], "One": [6, 16, 84], "neither": [6, 13], "nor": [6, 13], "consist": [6, 11, 14, 16, 19, 32, 83, 84, 87, 88], "mani": [6, 13, 14, 16, 19, 25, 28, 32, 50, 53, 68, 78, 84, 87, 88], "subset": [6, 12, 19, 44, 45, 46, 47, 48, 88], "smallest": 6, "uniformli": [6, 19, 88], "infeas": 6, "sort": 6, "fair": 6, "coin": [6, 84], "toss": 6, "per": [6, 10, 32, 50, 73, 84, 89], "nvec": 6, "int64": [6, 7], "game": [6, 9, 13, 16, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 57, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 81, 87, 88], "keyboard": [6, 9], "alwai": [6, 7, 13, 19, 88], "noop": [6, 9, 13, 19, 21, 23, 24, 25, 26, 27, 30, 32, 34, 35, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 52, 55, 57, 58, 59, 61, 62, 64, 69, 71, 72, 74, 75, 76, 78, 79], "nintendo": 6, "conceptu": 6, "arrow": [6, 62], "left": [6, 19, 21, 23, 24, 25, 26, 30, 34, 35, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 50, 51, 52, 55, 57, 58, 59, 61, 64, 68, 69, 71, 72, 74, 75, 78, 79, 87, 88], "param": 6, "min": [6, 12], "max": [6, 12, 13, 87], "press": [6, 9, 16], "although": 6, "rare": 6, "d": [6, 9], "categor": 6, "vector": [6, 9, 11], "count": [6, 87], "complic": [6, 11], "kind": 6, "unless": [6, 11, 88], "max_length": 6, "min_length": 6, "charset": 6, "frozenset": 6, "6": [6, 7, 19, 23, 24, 25, 26, 30, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 52, 55, 57, 59, 73, 74, 75, 78, 79], "7": [6, 9, 19, 23, 25, 26, 30, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 52, 55, 57, 59, 74, 75, 78, 79], "8": [6, 9, 10, 17, 19, 21, 23, 25, 26, 28, 30, 34, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 52, 55, 57, 58, 74, 78, 79, 87], "9": [6, 8, 10, 19, 23, 26, 31, 39, 44, 45, 46, 47, 48, 52, 55, 65, 74, 79], "c": [6, 67, 84], "f": [6, 14, 15], "h": 6, "j": [6, 19], "k": [6, 7, 9, 13], "l": [6, 13], "m": [6, 7, 19, 88], "o": 6, "p": 6, "q": [6, 64, 89], "w": [6, 9], "z": [6, 87], "compris": 6, "charact": [6, 9, 52, 63], "b5": 6, "hello": 6, "0123456789": 6, "digit": [6, 84], "inclus": [6, 19], "prevent": [6, 10, 41, 84], "empti": [6, 8, 13, 68, 87], "english": 6, "alphabet": 6, "plu": [6, 35], "latin": 6, "charlist": 6, "zero": [6, 8, 84, 87, 88, 89], "matter": 6, "equival": [7, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80], "would": [7, 12, 14, 15, 88], "notimplementederror": 7, "cannot": [7, 8, 13, 16, 18, 88, 89], "attempt": 7, "compound": 7, "func": 7, "oper": [7, 13], "itself": [7, 10, 11, 13, 16], "boundari": 7, "while": [7, 18, 19, 22, 23, 38, 53, 56, 57, 58, 59, 62, 64, 66, 68, 72, 75, 77, 84, 87, 88, 89], "being": [7, 13, 18, 39, 84, 87], "exactli": 7, "origin": [7, 10, 12, 13, 14, 18, 84], "effect": [7, 8, 11, 13, 14, 16, 19, 44, 45, 46, 47, 48, 87], "flattenend": 7, "60": [7, 52, 65, 84], "recurs": 7, "12": [7, 19, 26, 28, 32, 34, 44, 45, 46, 47, 48, 52, 55, 67, 87], "hot": 7, "match": [7, 10, 12, 73], "copi": [8, 10, 84, 88], "item": [8, 9, 84, 87], "_": [8, 9, 10, 11, 16, 86], "6348213": 8, "28607962": 8, "60760117": 8, "87383074": 8, "192658": 8, "2148103": 8, "99644893": 8, "08304597": 8, "7238421": 8, "35848552": 8, "1533453": 8, "67958736": 8, "49076623": 8, "38661423": 8, "7975036": 8, "93317133": 8, "stopiter": 8, "fn": 8, "built": [8, 18, 84], "multi_binari": 8, "multi_discret": 8, "ctx": 8, "multiprocess": [8, 10], "opt": 8, "hostedtoolcach": 8, "15": [8, 19, 41, 44, 45, 46, 47, 48, 52, 71, 84], "x64": 8, "lib": 8, "python3": 8, "process": [8, 9, 10, 14, 16, 88, 89], "eventu": 8, "shared_memori": [8, 10], "customspaceerror": 8, "read": [8, 18, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80], "forward": [8, 30, 51], "vice": [8, 13], "versa": [8, 13], "side": [8, 14, 21, 34, 48, 50], "write": [8, 10, 88], "num_env": [8, 10], "plai": [9, 16, 29, 41, 54, 73, 78, 84, 87, 88], "transpos": [9, 88], "zoom": 9, "callback": 9, "keys_to_act": 9, "dw": 9, "particularli": [9, 13], "verifi": 9, "level": [9, 16, 19, 26, 42, 64, 72, 84], "preprocess": [9, 11], "unplay": 9, "wish": [9, 14, 18], "real": [9, 50, 84], "statist": 9, "playplot": 9, "here": [9, 88], "last": [9, 13, 40, 41, 51, 88, 89], "150": 9, "def": [9, 11, 12, 14, 15, 87, 88], "obs_t": 9, "obs_tp1": 9, "rew": [9, 89], "plotter": 9, "render_fp": [9, 13, 88], "30": [9, 13, 19, 62, 65], "amount": [9, 38, 40, 41, 43, 49, 68], "input": [9, 10, 16, 87], "receiv": [9, 10, 16, 29, 32, 36, 38, 39, 45, 51, 54, 87, 89], "map": [9, 14, 16, 37, 87, 88], "unicod": 9, "suppos": 9, "trigger": 9, "key_to_act": 9, "ord": [9, 88], "unknown": [9, 84], "horizon_timestep": 9, "plot_nam": 9, "live": [9, 22, 25, 28, 29, 31, 34, 38, 39, 42, 49, 53, 54, 60, 66, 71, 87], "transit": [9, 16, 19, 44, 45, 46, 47, 48, 89], "compute_metr": 9, "obs_tp": 9, "cumulative_reward": 9, "linalg": [9, 88], "norm": [9, 88], "its": [9, 10, 12, 13, 34, 40, 63, 75, 80, 83, 84], "along": [9, 11, 16, 17, 18, 52, 53, 55, 66], "conjunct": 9, "evolv": 9, "200": [9, 43, 66], "immedi": [9, 11, 15, 88], "cumul": [9, 11, 13], "magnitud": 9, "your_env": 9, "len": [9, 12], "horizon": [9, 68, 89], "titl": [9, 87], "dependencynotinstal": [9, 13], "matplotlib": [9, 87], "playablegam": 9, "process_ev": 9, "event": [9, 84, 88], "particular": [9, 11, 14, 16, 17, 89], "keep": [9, 11, 13, 27, 39, 58, 61, 69, 70, 78, 88], "track": [9, 11, 13, 70], "exit": [9, 10], "save_video": 9, "video_fold": [9, 13], "episode_trigg": [9, 13], "step_trigg": [9, 13], "video_length": [9, 13], "name_prefix": [9, 13], "rl": [9, 13, 86, 87, 89], "episode_index": 9, "step_starting_index": 9, "extract": 9, "compos": 9, "record": [9, 11], "store": [9, 10, 13], "iff": [9, 13, 88], "isn": 9, "entir": [9, 13, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 84], "snippet": [9, 13], "captur": [9, 13, 77], "Will": [9, 13], "prepend": [9, 13], "filenam": [9, 13], "moviepi": 9, "imagesequenceclip": 9, "durat": 9, "step_index": 9, "199": 9, "capped_cubic_video_schedul": 9, "episode_id": 9, "27": 9, "729": 9, "1000": [9, 13, 16, 66, 68, 86], "2000": 9, "3000": 9, "schedul": 9, "step_api_compat": [9, 17], "step_return": 9, "output_truncation_bool": [9, 13], "is_vector_env": 9, "doc": [9, 13], "ob": [9, 11, 14, 87], "interfac": [9, 84, 86], "conflict": [9, 84], "written": [9, 11, 18, 84], "final": [9, 10, 13, 51, 88, 89], "desir": 9, "oldenv": 9, "vec_env": 9, "convert_to_terminated_truncated_step_api": [9, 17], "irrespect": 9, "convert_to_done_step_api": 9, "omit": [9, 83], "env_check": 9, "check_env": 9, "skip_render_check": 9, "invas": [9, 72], "farama": [9, 11, 88], "org": [9, 19, 84], "content": 9, "environment_cr": [9, 88], "ignor": [9, 19, 87], "skip": [9, 13, 19, 88], "ci": 9, "parallel": 10, "linear": 10, "speed": [10, 30, 84], "taken": [10, 13, 42, 48, 82, 88], "wait": [10, 42, 44, 68, 89], "until": [10, 11, 41, 54, 88], "overwritten": [10, 11], "final_observ": [10, 13], "final_info": [10, 13], "asyncvectorenv": 10, "syncvectorenv": 10, "single_observation_spac": 10, "single_action_spac": 10, "v25": [10, 18], "old": [10, 11, 13, 17, 86], "vectorlistinfo": [10, 11, 13], "rememb": [10, 13, 88], "share": 10, "other": [10, 11, 12, 13, 14, 17, 25, 34, 37, 44, 50, 83, 87, 88], "word": 10, "02240574": 10, "03439831": 10, "03904812": 10, "02810693": 10, "01586068": 10, "01929009": 10, "02394426": 10, "04016077": 10, "01314174": 10, "03893502": 10, "02400815": 10, "0038326": 10, "instead": [10, 14, 16, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 88], "00122802": 10, "16228443": 10, "02521779": 10, "23700266": 10, "00788269": 10, "17490888": 10, "03393489": 10, "31735462": 10, "04918966": 10, "19421194": 10, "02938497": 10, "29495203": 10, "releas": [10, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 84, 88], "resourc": [10, 87, 88], "viewer": 10, "close_extra": 10, "synchron": 10, "asynchron": 10, "garbag": 10, "program": [10, 84], "04456399": 10, "04653909": 10, "01326909": 10, "02099827": 10, "03073904": 10, "00145001": 10, "03088818": 10, "03131252": 10, "03468829": 10, "01500225": 10, "01230312": 10, "01825218": 10, "registri": [10, 16, 17], "env_fn": 10, "context": 10, "daemon": 10, "worker": [10, 62], "pipe": 10, "commun": 10, "lambda": [10, 14, 15, 87], "81": 10, "62": 10, "8286432": 10, "5597771": 10, "90249056": 10, "85009176": 10, "5266346": 10, "60007906": 10, "back": [10, 11, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 46, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81], "improv": 10, "effici": [10, 14, 84], "larg": [10, 11, 84], "subprocess": 10, "flag": [10, 84], "turn": [10, 13, 18, 22, 23], "quit": [10, 88], "head": 10, "spawn": 10, "children": 10, "overrid": [10, 11], "inner": 10, "logic": [10, 88], "advanc": [10, 84], "degre": [10, 14], "flexibl": [10, 84], "chanc": 10, "shoot": [10, 26, 35, 37, 41, 42, 49, 50, 59, 62, 66, 71, 72, 80], "yourself": [10, 42, 62, 87, 88], "foot": 10, "thu": [10, 19, 44, 45, 46, 47, 48, 84], "own": [10, 18, 34, 68], "_worker": 10, "_worker_shared_memori": 10, "runtimeerror": 10, "serial": 10, "modular": [11, 12, 14, 15, 16, 84, 88], "behavior": [11, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 84, 88], "modif": 11, "without": [11, 16, 40, 87, 88], "alter": [11, 16, 19, 88], "lot": [11, 16, 87], "boilerpl": [11, 16, 88], "chain": [11, 16], "rescaleact": [11, 12, 16], "base_env": [11, 16], "wrapped_env": [11, 12, 13, 16, 88], "min_act": [11, 12, 16], "max_act": [11, 12, 16], "access": [11, 13, 18, 49, 84], "underneath": [11, 16], "anoth": [11, 34, 89], "orderenforc": [11, 13, 16, 88], "get": [11, 16, 19, 38, 41, 42, 43, 50, 60, 61, 62, 63, 65, 66, 67, 72, 87, 89], "layer": [11, 16, 84], "bare": 11, "just": [11, 16, 18, 44, 50, 67], "box2d": [11, 16], "bipedal_walk": [11, 16], "0x7f87d70712d0": [11, 16], "three": [11, 19, 22, 25, 27, 39, 47, 53, 60, 65, 66, 67, 68, 88], "thing": [11, 14, 19], "do": [11, 13, 14, 15, 19, 32, 43, 64, 68, 69, 84, 88], "Such": 11, "actionwrapp": [11, 12], "observationwrapp": [11, 14, 88], "rewardwrapp": [11, 15], "present": [11, 84, 87, 88, 89], "section": [11, 19, 69, 87, 88], "found": [11, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 83, 87], "github": [11, 83, 88], "com": [11, 84, 88], "foundat": [11, 88], "forget": [11, 88], "commonli": [11, 16], "page": [11, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 84], "descript": [11, 84, 88], "ataripreprocess": [11, 13], "misc": 11, "tp": 11, "atari": [11, 16, 17, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 87], "clipact": [11, 12, 16], "clip": [11, 15, 16, 88], "envcompat": [11, 13, 17, 18], "compat": [11, 14, 16, 84, 86], "21": [11, 17, 87], "filterobserv": [11, 14], "filter": 11, "request": 11, "framestack": [11, 13], "anobserv": 11, "stack": [11, 14], "roll": [11, 14, 32], "grayscaleobserv": [11, 14], "grai": [11, 13], "scale": [11, 13, 15, 19, 84], "humanrend": [11, 13], "normalizeobserv": [11, 14], "center": [11, 14, 84], "unit": [11, 14, 52], "varianc": [11, 14, 15], "normalizereward": [11, 15], "averag": [11, 15, 89], "pixelobservationwrapp": [11, 14], "augment": [11, 14], "obtain": [11, 13, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 89], "ad": [11, 13, 14, 16, 18, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 46, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 83, 84, 88], "replac": [11, 18, 87], "recordepisodestatist": [11, 13, 18], "recordvideo": [11, 13, 18], "rollout": [11, 13], "save": [11, 13, 18], "rescal": [11, 16], "resizeobserv": [11, 14], "axbxc": [11, 14], "resiz": [11, 13], "timeawareobserv": [11, 14, 16], "trajectori": [11, 14, 15], "append": [11, 14], "transformobserv": [11, 14], "transformreward": [11, 15], "th": 11, "sometim": [11, 15, 88], "still": [11, 17, 19, 87], "let": [11, 12, 15, 19, 34, 84, 87, 88], "penal": [11, 69], "energi": [11, 84], "weight": [11, 84, 89], "those": [11, 21, 23, 24, 25, 26, 27, 30, 32, 34, 35, 38, 40, 41, 42, 43, 52, 55, 57, 58, 59, 61, 62, 64, 69, 71, 72, 74, 75, 76, 78, 79, 83], "nevertheless": 11, "reacherrewardwrapp": 11, "reward_dist_weight": 11, "reward_ctrl_weight": 11, "reward_dist": 11, "reward_ctrl": 11, "suffici": [11, 25, 27, 29, 31, 36, 87], "simpli": [12, 13, 14, 15, 19, 88], "overwrit": [12, 14, 15], "domain": [12, 84], "sai": [12, 13], "discreteact": 12, "disc_to_cont": 12, "act": [12, 87], "__name__": 12, "__main__": 12, "print": [12, 87, 88], "among": [12, 14, 82, 83], "biped": 12, "walker": [12, 83], "affin": 12, "75": 12, "noop_max": 13, "frame_skip": 13, "screen_siz": 13, "84": 13, "terminal_on_life_loss": 13, "grayscale_ob": 13, "grayscale_newaxi": 13, "scale_ob": 13, "2600": [13, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80], "guidelin": 13, "machado": [13, 19], "et": [13, 19], "al": [13, 17, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 87], "2018": [13, 19], "revisit": [13, 19], "arcad": [13, 19, 26, 42, 44, 45, 46, 47, 48, 84], "evalu": [13, 19, 84, 87], "protocol": [13, 19], "open": [13, 19, 32, 83, 84, 88], "problem": [13, 19, 86, 87, 89], "stage": 13, "op": 13, "pool": 13, "recent": [13, 14, 15, 17, 84], "life": [13, 25, 38, 42, 66, 70], "lost": [13, 28, 36, 54, 67, 71], "loss": 13, "off": [13, 18, 36, 50, 58, 66], "Not": 13, "squar": [13, 14, 67, 88], "210x180": 13, "84x84": 13, "grayscal": [13, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80], "colour": 13, "greyscal": 13, "255": [13, 14, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 88], "No": 13, "frequenc": 13, "experi": [13, 84, 87], "whenev": [13, 25, 28, 88], "channel": 13, "axi": [13, 87], "dimension": [13, 16, 23, 84, 88], "memori": [13, 14], "optim": [13, 19, 84], "benefit": 13, "opencv": 13, "caus": [13, 16, 51], "new_ob": 13, "final_reward": 13, "final_termin": 13, "final_trunc": 13, "final_don": 13, "prior": [13, 84], "alongsid": [13, 84], "previou": [13, 89], "re": [13, 50, 65, 68, 88], "old_env": 13, "legacyenv": 13, "retun": 13, "modern": [13, 84], "convers": [13, 84], "passiveenvcheck": [13, 16], "cartpoleenv": 13, "customenv": 13, "manual": [13, 16, 19, 44, 45, 46, 47, 48, 84], "unregist": 13, "surround": [13, 84], "test": [13, 84, 88], "haven": 13, "screen": [13, 19, 21, 25, 29, 34, 35, 37, 45, 51, 57, 67, 68], "nativ": [13, 85], "nonativerend": 13, "disable_render_order_enforc": 13, "classic_control": [13, 18, 82], "resetneed": 13, "deque_s": 13, "At": [13, 16, 28, 38, 41, 52], "_episod": 13, "elaps": 13, "sinc": [13, 17, 19, 44, 45, 46, 47, 48, 81, 83, 84, 88, 89], "begin": [13, 18, 25, 28, 40, 65, 66, 67, 68, 87, 88], "num": [13, 19, 21, 23, 24, 25, 26, 27, 30, 32, 34, 35, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 52, 55, 57, 58, 59, 61, 62, 64, 69, 71, 72, 74, 75, 76, 78, 79], "buffer": [13, 14, 84], "return_queu": 13, "length_queu": 13, "intermitt": 13, "hundredth": 13, "emploi": 13, "stop": [13, 16, 62, 72, 80, 84, 87, 89], "span": 13, "strictli": 13, "pop_fram": 13, "reset_clean": 13, "clear": [13, 72], "issu": [13, 16, 18, 19, 88], "place": [13, 23, 88], "part": [13, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 83, 89], "\u01f9one": 13, "intend": [13, 84], "around": [13, 29, 81, 84], "outermost": 13, "actual": [13, 88], "_k": 13, "classic": [13, 16, 18, 89], "reflect": 14, "2d": [14, 84], "navig": [14, 28, 63, 88], "agent_posit": 14, "target_posit": 14, "throw": [14, 53], "awai": [14, 22, 61], "freedom": 14, "target": [14, 35, 84, 87, 88, 89], "rel": [14, 88], "relativeposit": [14, 88], "ideal": 14, "subclass": 14, "accordingli": [14, 68, 88], "were": [14, 18, 36, 81, 85, 88], "incorrectli": [14, 89], "randn": 14, "08319338": 14, "04635121": 14, "07394746": 14, "20877492": 14, "filter_kei": 14, "00067088": 14, "01860439": 14, "04772898": 14, "01911527": 14, "04560107": 14, "04466959": 14, "0328232": 14, "02367178": 14, "04649447": 14, "14996664": 14, "03329664": 14, "25847703": 14, "96": [14, 19], "27648": 14, "num_stack": 14, "lz4_compress": 14, "lazyfram": 14, "fill": [14, 28, 88], "lz4": 14, "compress": 14, "keep_dim": 14, "uint8": [14, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80], "singleton": 14, "axbx1": 14, "axb": 14, "epsilon": [14, 15, 84, 87], "1e": [14, 15, 87], "08": [14, 15], "past": [14, 15], "newli": [14, 15], "stabil": [14, 15], "pixels_onli": 14, "render_kwarg": 14, "pixel_kei": 14, "choos": [14, 88], "odict_kei": 14, "400": 14, "600": [14, 84], "discard": 14, "assertionerror": 14, "show": [14, 18, 19, 29, 35, 87], "typeerror": 14, "unexpect": 14, "64": [14, 19], "03810719": 14, "03522411": 14, "02231044": 14, "01088205": 14, "03881167": 14, "16021058": 14, "0220928": 14, "28875574": 14, "becaus": [15, 87, 88], "intrins": 15, "gain": [15, 29, 64, 70, 71, 74], "numer": 15, "clipreward": 15, "min_reward": 15, "max_reward": 15, "invari": 15, "incorrect": [15, 89], "gamma": [15, 89], "99": 15, "discount": [15, 89], "factor": 15, "project": [16, 18, 84, 87], "mountain": [16, 82], "car": [16, 28, 43, 82, 84], "four": [16, 28, 38, 87], "introduc": [16, 17, 18], "core": [16, 84], "markov": [16, 89], "decis": [16, 18, 84, 89], "theori": [16, 84], "perfect": 16, "reconstruct": 16, "miss": [16, 69], "compon": [16, 88], "veri": [16, 84, 88], "easi": [16, 54, 84, 85], "loop": [16, 18, 84, 87], "pictur": 16, "simplifi": [16, 84], "someth": 16, "spaceship": [16, 26, 39, 70], "land": [16, 33, 66], "safe": [16, 62], "document": [16, 19, 20, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 85, 88], "imagin": [16, 84], "robot": [16, 18, 31, 80, 83, 89], "destroi": [16, 22, 24, 26, 27, 28, 29, 30, 31, 34, 35, 36, 37, 39, 40, 48, 54, 65, 66, 67, 70, 71, 72, 74], "enemi": [16, 23, 24, 27, 29, 30, 31, 37, 39, 40, 42, 55, 64, 65, 67, 68, 70, 71, 72, 74, 80], "exchang": 16, "crash": 16, "succeed": 16, "similarli": 16, "restart": 16, "train": [16, 18, 87], "major": [16, 18], "our": [16, 84, 87, 88], "simpl": [16, 85, 86, 89], "util": [16, 17, 88], "coupl": 16, "nich": 16, "li": [16, 84], "lie": 16, "full": [16, 19, 44, 45, 46, 47, 48], "aspect": [16, 89], "regist": [17, 19], "sole": 17, "appear": [17, 26, 28, 31, 67], "special": [17, 22, 51], "gymv26environ": 17, "pong": [17, 19, 34], "v5": [17, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80], "increas": [17, 40, 68], "backward": 17, "oldv21env": 17, "librari": [18, 84, 85, 86, 88], "briefli": 18, "outlin": [18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80], "123": 18, "emul": [18, 19], "awar": 18, "randint": 18, "utilis": 18, "compar": [18, 87], "extra": [18, 23, 28, 29, 31, 35, 37, 49, 68, 84, 87, 88], "definit": [18, 89], "reproduct": 18, "expand": [18, 19, 44, 45, 46, 47, 48], "blog": 18, "post": [18, 27], "soon": [18, 88], "publish": 18, "These": [18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 83, 84, 85, 87], "address": 18, "associ": 18, "primarili": 18, "shouldn": [18, 88], "happen": [18, 67, 89], "fly": [18, 21, 26, 49, 65], "shown": [18, 53, 89], "explan": [18, 87], "summari": 18, "goalenv": 18, "reimplement": 18, "system": [18, 48, 84], "monitor": 18, "stella": 19, "licens": [19, 84, 87], "download": [19, 84, 87, 88, 89], "locat": [19, 54, 84, 88], "agre": 19, "todo": 19, "legal": [19, 44, 45, 46, 47, 48], "fire": [19, 21, 23, 24, 26, 27, 30, 32, 34, 35, 44, 45, 46, 47, 48, 51, 58, 59, 61, 62, 64, 65, 67, 68, 71, 72, 74, 76, 78, 79], "upright": [19, 25, 26, 30, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 52, 57], "upleft": [19, 25, 26, 30, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 52, 57], "downright": [19, 25, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 52, 55, 57], "downleft": [19, 25, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 52, 55, 57], "upfir": [19, 23, 26, 32, 44, 45, 46, 47, 48, 62, 74, 75, 76, 78, 79], "11": [19, 26, 44, 45, 46, 47, 48, 52, 55, 87], "rightfir": [19, 21, 23, 24, 26, 27, 30, 35, 44, 45, 46, 47, 48, 52, 55, 58, 59, 61, 71, 74, 75, 78, 79], "leftfir": [19, 21, 23, 24, 26, 27, 35, 44, 45, 46, 47, 48, 52, 55, 58, 59, 61, 71, 74, 75, 78, 79], "13": [19, 26, 44, 45, 46, 47, 48, 52, 55], "downfir": [19, 23, 26, 32, 44, 45, 46, 47, 48, 52, 55, 59, 62, 74, 76, 79], "14": [19, 44, 45, 46, 47, 48, 52, 87], "uprightfir": [19, 26, 44, 45, 46, 47, 48, 52, 55], "upleftfir": [19, 26, 44, 45, 46, 47, 48, 52, 55], "16": [19, 28, 31, 34, 39, 44, 45, 46, 47, 48, 52, 84, 87], "downrightfir": [19, 44, 45, 46, 47, 48, 52, 55], "17": [19, 31, 44, 45, 46, 47, 48, 52], "downleftfir": [19, 44, 45, 46, 47, 48, 52, 55], "smaller": [19, 24, 26, 44, 45, 46, 47, 48], "enumer": [19, 44, 45, 46, 47, 48], "full_action_spac": [19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80], "reduc": [19, 21, 23, 24, 25, 26, 27, 30, 32, 34, 35, 38, 40, 41, 42, 43, 44, 45, 46, 47, 48, 52, 55, 57, 58, 59, 61, 62, 64, 69, 71, 72, 74, 75, 76, 78, 79], "difficulti": [19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 84], "choic": 19, "player": [19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 87], "128": [19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80], "byte": [19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80], "ram": [19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80], "consol": [19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80], "exact": [19, 32, 44, 45, 46, 47, 48], "atariag": [19, 20, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 73, 75, 76, 77, 78, 79, 80], "determinist": [19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 88], "art": 19, "memor": 19, "sticki": [19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80], "small": [19, 48, 67, 84, 85], "previous": [19, 28], "On": [19, 59], "top": [19, 34, 38, 45, 51, 53, 67, 82, 88], "repeat": 19, "frameskip": [19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80], "exclus": 19, "tabl": [19, 22, 23, 25, 38, 40], "obs_typ": 19, "Its": 19, "repeat_action_prob": [19, 44, 45, 46, 47, 48], "stick": [19, 28, 49, 87], "ll": [19, 51, 68, 87], "sound": [19, 84], "lock": 19, "proper": 19, "audio": 19, "framer": [19, 88], "best": [19, 44, 45, 46, 47, 48, 84, 87], "practic": [19, 44, 45, 46, 47, 48, 84, 87, 89], "configur": [19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 87, 88], "variat": 19, "amidar": [19, 27], "amidardeterminist": 19, "amidarnoframeskip": 19, "ramdeterminist": 19, "ramnoframeskip": 19, "suffix": [19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80], "noframeskip": [19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80], "adventur": 19, "airraid": [19, 21], "alien": [19, 39, 59, 72], "assault": 19, "asterix": 19, "asteroid": 19, "31": [19, 26], "atlanti": 19, "bankheist": [19, 28], "20": [19, 28, 34, 60, 68, 84, 87], "24": [19, 28, 34, 58], "28": [19, 28, 34], "battlezon": [19, 29], "beamrid": [19, 30], "berzerk": 19, "18": [19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80], "bowl": 19, "breakout": 19, "32": [19, 34, 50], "36": [19, 34], "40": [19, 34, 58], "44": [19, 34], "carniv": 19, "centiped": 19, "22": [19, 36, 87], "86": [19, 36], "choppercommand": [19, 37], "crazyclimb": [19, 38], "defend": [19, 27, 42, 58, 70], "demonattack": [19, 40], "doubledunk": [19, 41], "elevatoract": [19, 42], "enduro": 19, "fishingderbi": 19, "freewai": 19, "frostbit": 19, "gopher": 19, "gravitar": 19, "hero": 19, "icehockei": 19, "jamesbond": 19, "journeyescap": 19, "kangaroo": 19, "krull": 19, "kungfumast": [19, 55], "montezumareveng": [19, 56], "mspacman": [19, 57], "namethisgam": [19, 58], "phoenix": 19, "pitfal": 19, "pooyan": 19, "50": [19, 52, 62, 68], "70": [19, 62], "privateey": 19, "qbert": 19, "riverraid": 19, "roadrunn": [19, 66], "robotank": [19, 67], "seaquest": 19, "ski": 19, "solari": 19, "spaceinvad": 19, "stargunn": 19, "tenni": 19, "timepilot": 19, "tutankham": 19, "upndown": [19, 76], "ventur": 19, "videopinbal": [19, 78, 79], "wizardofwor": [19, 79], "yarsreveng": 19, "zaxxon": 19, "oppos": 19, "ai": 19, "mg": 19, "bellemar": 19, "naddaf": 19, "veness": 19, "platform": [19, 84], "journal": 19, "artifici": 19, "intellig": 19, "research": [19, 83, 84], "2012": 19, "url": 19, "jair": 19, "php": 19, "articl": [19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80], "view": [19, 48, 84], "11182": 19, "250": [20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80], "160": [20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80], "enchant": [20, 36], "chalic": 20, "golden": 20, "castl": 20, "pick": [20, 42, 53, 66, 87], "sword": 20, "bridg": [20, 65, 84], "magnet": 20, "fight": [20, 33, 55, 58, 84], "outmanoeuvr": 20, "dragon": 20, "flavor": [20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80], "switch": [20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 84], "thorough": [20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80], "discuss": [20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80], "intric": [20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80], "stochast": [20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 82, 83, 84], "ship": [21, 22, 24, 30, 39, 48, 70], "sidewai": [21, 24, 30, 65, 69], "protect": [21, 27, 36, 37, 47, 52, 62], "saucer": [21, 26, 72], "try": [21, 22, 23, 32, 34, 38, 61, 62, 87], "drop": [21, 28], "bomb": [21, 39, 51, 59, 72], "meaning": [21, 23, 24, 25, 26, 27, 30, 32, 34, 35, 38, 40, 41, 42, 43, 52, 55, 57, 58, 59, 61, 62, 64, 69, 71, 72, 74, 75, 76, 78, 79], "210": [22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 36, 37, 39, 40, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80], "stuck": [22, 31, 49], "maze": [22, 23, 28, 31, 56, 75], "egg": 22, "scatter": [22, 63], "simultan": [22, 23], "kill": [22, 31, 49, 54], "flamethrow": 22, "tricki": 22, "situat": 22, "occasion": [22, 26], "power": [22, 49, 84], "pulsar": 22, "temporari": 22, "abil": 22, "score": [22, 23, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 49, 50, 51, 52, 53, 54, 60, 61, 62, 63, 64, 65, 66, 68, 72, 73, 74, 78], "prize": [22, 76], "caught": [22, 28], "lose": [22, 25, 27, 36, 38, 39, 42, 49, 51, 60, 61, 63, 65, 66, 68, 69, 70], "consult": [22, 50, 51, 52, 53, 54], "pac": 23, "man": 23, "visit": [23, 42], "grid": [23, 84, 87, 88], "chicken": [23, 35, 45], "catch": [23, 38, 44, 66], "travers": 23, "vehicl": [24, 29, 43, 52, 84], "big": [24, 44, 88], "mother": [24, 53, 62], "circl": [24, 88], "overhead": 24, "deploi": 24, "drone": 24, "dodg": [24, 30, 68], "attack": [24, 26, 27, 30, 39, 62], "horizont": [25, 35, 88], "vertic": [25, 84, 88], "lyre": 25, "guid": [25, 45, 84], "award": [25, 31, 36, 38, 42, 68], "field": [26, 84], "break": [26, 34], "satellit": 26, "ufo": 26, "job": [27, 88], "submerg": 27, "citi": [27, 28, 63, 84], "slowli": 27, "descend": 27, "toward": [27, 50], "strike": [27, 32], "distanc": [27, 43, 88], "defens": [27, 41], "manag": [27, 32], "seven": 27, "fought": 27, "wave": [27, 37, 40, 52, 59, 72], "outer": 27, "robber": 28, "natur": [28, 87], "rob": 28, "getawai": 28, "polic": 28, "chase": [28, 31], "dynamit": [28, 49], "ga": 28, "tank": [28, 29, 68], "nine": 28, "leav": [28, 83, 88], "person": [29, 84], "perspect": [29, 84], "3d": [29, 84, 87], "illus": 29, "radar": [29, 79], "travel": 30, "constant": [30, 68], "steer": [30, 76], "debri": 30, "leftifir": 30, "evil": [31, 55, 80], "touch": [31, 63, 88], "wall": [31, 34, 49], "undefeat": 31, "otto": 31, "tri": 32, "knock": [32, 33], "pin": 32, "spar": 32, "spare": 32, "300": [32, 43, 88], "oppon": [33, 44, 50, 61, 76], "ring": 33, "hit": [33, 34, 35, 36, 40, 62, 63, 66, 67, 69, 87], "punch": [33, 53], "famou": 34, "paddl": [34, 61], "ball": [34, 50, 61, 78], "brick": 34, "wreak": 34, "havoc": 34, "five": [34, 63, 69, 82], "214": 35, "em": 35, "gun": [35, 42], "suppli": [35, 58, 89], "ammunit": 35, "steal": [35, 44], "bullet": [35, 84], "subtract": 35, "minu": 35, "sign": 35, "elf": 36, "magic": 36, "wand": 36, "fend": 36, "spider": 36, "flea": 36, "mushroom": 36, "forest": 36, "bitten": 36, "tempor": 36, "paralyz": 36, "scorpion": 36, "round": 36, "helicopt": [37, 38, 65], "truck": [37, 66], "convoi": 37, "aircraft": [37, 74], "mini": 37, "bottom": [37, 51], "plane": 37, "surviv": [37, 40], "builid": 38, "obstacl": [38, 52, 53], "fall": [38, 40, 60, 66, 89], "damag": [38, 67], "climb": [38, 53, 82, 84], "fast": [38, 83, 84], "least": [38, 73], "row": [38, 71], "earth": [39, 71], "rescu": [39, 49, 53, 54, 55, 68, 70], "smart": 39, "shot": [39, 41, 42, 50, 51, 66, 84], "abduct": 39, "unlimit": 39, "laser": [39, 49, 71, 79], "missil": [39, 65], "aliv": 39, "face": [40, 87], "ic": [40, 46, 50], "planet": [40, 48, 70], "krybor": 40, "accumul": 40, "reserv": [40, 65, 67, 68], "bunker": [40, 48], "grant": 40, "slai": 40, "2v2": 41, "basketbal": 41, "possess": 41, "rival": 41, "team": 41, "rule": [41, 73, 84, 87], "foul": 41, "success": [41, 89], "secret": [42, 63], "ground": [42, 62, 84], "stair": 42, "equip": 42, "against": [42, 61, 73, 84], "floor": 42, "gather": [42, 63, 88], "apart": [42, 88], "mark": 42, "red": [42, 48, 88], "door": [42, 84], "unreleas": 42, "prototyp": 42, "500": [42, 65], "racer": 43, "nation": 43, "long": [43, 78], "endur": 43, "race": [43, 66, 69], "overtak": 43, "dai": [43, 81], "stai": 43, "meet": 43, "quota": 43, "sunfish": 44, "But": [44, 69], "fisherman": 44, "black": [44, 54, 87], "shark": [44, 58, 68], "lurk": [44, 64], "surfac": [44, 68, 88], "lane": [45, 84], "busi": 45, "rush": 45, "hour": 45, "traffic": 45, "cross": 45, "bailei": 46, "who": [46, 47, 52, 53, 69], "hop": [46, 64], "forth": 46, "arctic": 46, "river": [46, 65], "block": [46, 84], "white": 46, "blue": [46, 48, 73, 88], "he": [46, 48], "hi": [46, 48, 63], "igloo": 46, "shovel": 47, "wield": 47, "farmer": 47, "crop": 47, "carrot": 47, "spacecraft": 48, "fiction": 48, "solar": 48, "landscap": 48, "miner": 49, "mine": [49, 66], "shaft": 49, "tool": [49, 56], "propel": 49, "backpack": 49, "wherev": 49, "blast": [49, 68, 70], "beam": 49, "vermin": 49, "raft": 49, "stretch": 49, "critter": 49, "remain": [49, 52, 53, 68, 88, 89], "standard": [50, 84], "hockei": 50, "minut": [50, 60], "period": 50, "puck": 50, "angl": [50, 51], "extrem": [50, 84, 85], "aim": 50, "rink": 50, "realli": [50, 87], "mr": 51, "bond": 51, "design": [51, 85, 88], "multipurpos": 51, "craft": 51, "varieti": [51, 84], "motion": [51, 84], "slightli": 51, "jump": [51, 66, 69], "dive": 51, "lob": 51, "rate": [51, 68, 87], "highest": [51, 84], "novic": 51, "006": 51, "007": 51, "lead": 52, "journei": [52, 87], "peski": 52, "backstag": 52, "scarab": 52, "000": [52, 65, 68], "concert": 52, "cash": 52, "grasp": 52, "groupi": 52, "photograph": 52, "promot": 52, "encount": [52, 53, 74, 84], "her": [53, 62], "preciou": 53, "babi": 53, "ladder": 53, "bonu": [53, 67, 68, 72], "fruit": 53, "monkei": 53, "corner": 53, "beast": 54, "fortress": [54, 56], "princess": [54, 55], "lyssa": 54, "sunris": 54, "monster": [54, 77], "wizard": 55, "templ": 55, "victoria": 55, "defeat": [55, 64], "acquir": [56, 83], "treasur": [56, 58, 60, 75, 77], "chamber": [56, 77], "emperor": 56, "deadli": 56, "creatur": [56, 64, 72, 84], "valuabl": 56, "pellet": 57, "ghost": 57, "discov": 58, "octopu": 58, "ey": [58, 63, 84], "oxygen": [58, 68], "pilot": [59, 80], "elimin": [59, 75, 76, 77], "war": 59, "bird": 59, "harri": 60, "jungl": 60, "die": [60, 62], "misfortun": 60, "hole": 60, "compet": 61, "deflect": 61, "pig": 62, "piglet": 62, "wolv": 62, "rope": 62, "balloon": 62, "guard": 62, "eat": [62, 66], "bait": 62, "wolf": 62, "stone": 62, "rock": [62, 66], "french": 63, "privat": [63, 88], "pierr": 63, "street": 63, "park": 63, "passag": 63, "dead": 63, "search": [63, 84], "ringlead": 63, "henri": 63, "le": 63, "fiend": 63, "gang": 63, "evid": 63, "stolen": 63, "good": [63, 87], "statut": 63, "expir": 63, "nab": 63, "question": [63, 84], "auto": 63, "pothol": 63, "bert": 64, "cube": 64, "pyramid": 64, "destin": 64, "nasti": 64, "jet": 65, "fli": 65, "fuel": [65, 70], "depot": 65, "collid": [65, 68], "bank": 65, "squadron": [65, 67], "tanker": 65, "80": 65, "tm": 66, "direct": [66, 68, 84, 88], "outrun": 66, "wile": 66, "coyot": 66, "hazard": 66, "desert": 66, "rocket": [66, 67], "cannon": [66, 71], "cliff": 66, "steel": 66, "pile": 66, "birdse": 66, "cannonbal": 66, "activ": [67, 88], "scrambl": 67, "static": 67, "interfer": 67, "becom": [67, 81, 84, 89], "sensor": 67, "report": 67, "flash": 67, "panel": 67, "earn": 67, "twelv": 67, "abl": [68, 89], "torpedo": 68, "diver": 68, "killer": 68, "deliv": 68, "six": 68, "explod": 68, "anyth": 68, "decreas": 68, "almost": 68, "yoursub": 68, "blow": 68, "forc": [68, 70], "less": [68, 87], "worth": [68, 71], "90": [68, 87], "moment": 68, "skier": 69, "gate": [69, 84], "fastest": 69, "tree": 69, "slalom": 69, "penalti": 69, "warp": 70, "sector": 70, "feder": [70, 84], "zylon": 70, "refuel": 70, "cadet": 70, "corridor": 70, "invad": 71, "mania": [72, 74], "orang": 73, "win": [73, 87], "margin": 73, "ti": 73, "sport": 73, "till": [73, 87], "technologi": 74, "increasingli": 74, "futur": 74, "difficult": [74, 83], "rack": 75, "tomb": 75, "guardian": 75, "baja": 76, "bugger": 76, "dungeon": 77, "beat": 79, "scanner": 79, "armi": 80, "enslav": 80, "galaxi": 80, "fighter": 80, "toi": [81, 84], "contribut": 81, "earli": [81, 84, 87], "oleg": 81, "klimov": 81, "popular": [81, 84, 87], "benchmark": [81, 84], "ever": 81, "nois": [82, 83], "regard": 82, "underpow": 82, "effort": 82, "easier": 82, "ones": [82, 83], "stand": 83, "joint": 83, "contact": 83, "engin": 83, "facilit": [83, 84], "develop": 83, "biomechan": 83, "graphic": [83, 84], "anim": 83, "area": 83, "accur": [83, 84], "octob": 83, "2021": [83, 84], "deepmind": [83, 84], "2022": 83, "free": [83, 84, 87], "everyon": 83, "instruct": [83, 88], "websit": [83, 84], "framework": 83, "command": 83, "older": 83, "ten": 83, "iverteddoublependulum": 83, "gaussian": 83, "bodi": 83, "mjsim": 83, "qpo": 83, "qvel": 83, "calcul": 83, "indirectli": 83, "xml": 83, "tweak": 83, "doom": 84, "focus": 84, "visual": 84, "thousand": 84, "depth": 84, "annot": [84, 87], "label": [84, 87], "scenario": 84, "come": 84, "2016": 84, "paper": 84, "cite": 84, "clone": [84, 88], "huge": 84, "3v3": 84, "hundr": 84, "roughli": 84, "23": 84, "tweakabl": 84, "onlin": 84, "cost": 84, "monei": 84, "minecraft": 84, "spars": [84, 88], "challeng": [84, 87], "procedur": 84, "measur": 84, "quickli": 84, "generaliz": 84, "skill": 84, "slime": 84, "volleybal": 84, "motiv": 84, "maintain": [84, 86], "premad": 84, "imperfect": 84, "sum": [84, 87], "twisti": 84, "puzzl": 84, "weiqi": 84, "famous": 84, "conquer": 84, "alphago": 84, "synthes": 84, "neuro": 84, "architectur": 84, "integr": 84, "twin": 84, "concept": 84, "seamless": 84, "transfer": 84, "hardwar": 84, "world": 84, "firmwar": 84, "neuroflight": 84, "extens": 84, "ro": 84, "model": [84, 87], "thrust": 84, "ascend": 84, "shall": 84, "altitud": 84, "subject": 84, "vari": 84, "aerodynam": 84, "drag": 84, "graviti": 84, "mass": 84, "light": 84, "poli": 84, "articul": 84, "pinocchio": 84, "meshcat": 84, "web": 84, "minimalist": 84, "interior": 84, "room": 84, "hallwai": 84, "offic": 84, "home": 84, "seen": 84, "dmlab": 84, "bitcraz": 84, "crazyfli": 84, "nanoquadrotor": 84, "mar": 84, "endeavor": 84, "gap": 84, "deep": [84, 89], "methodologi": 84, "coverag": 84, "terrain": 84, "arm": 84, "commerci": 84, "mac": 84, "linux": 84, "applic": 84, "laboratori": 84, "internet": 84, "realist": 84, "virtual": [84, 88], "ego": 84, "front": 84, "camera": 84, "lidar": 84, "cloud": 84, "semant": 84, "cours": 84, "wide": 84, "account": 84, "scheme": 84, "yield": 84, "voltag": 84, "duti": 84, "cycl": 84, "plan": 84, "emphasi": 84, "percept": 84, "social": 84, "driver": 84, "whose": 84, "uncertain": 84, "propos": 84, "merg": 84, "intersect": 84, "roundabout": 84, "longitudin": 84, "comprehens": 84, "conduct": 84, "akin": 84, "anomali": 84, "inject": 84, "studi": 84, "robust": 84, "brax": 84, "friction": 84, "compil": 84, "llvm": 84, "phase": 84, "gcc": 84, "cuda": 84, "hyperparamet": [84, 87], "cheap": 84, "surrog": 84, "evolutionari": 84, "obsolet": 84, "windygrid": 84, "bandit": 84, "server": 84, "advertis": 84, "greedi": [84, 87], "softmax": 84, "ucb1": 84, "trade": 84, "great": [84, 87], "focu": 84, "simplic": 84, "autom": 84, "deduct": 84, "verif": 84, "cell": [84, 88], "minatar": 84, "metatrad": 84, "unus": 84, "techniqu": 84, "hard": 84, "strive": 84, "novel": 84, "transport": 84, "push": 84, "warehous": 84, "storag": 84, "advantag": [84, 88], "overfit": 84, "predefin": [84, 88], "mathemat": 84, "synthesi": 84, "dataset": 84, "arxiv": 84, "ab": 84, "2107": 84, "07373": 84, "baselin": 84, "expos": 84, "na": 84, "blockqnn": 84, "wise": 84, "nsc": 84, "accuraci": 84, "far": 84, "cifar": 84, "meta": 84, "tag": 84, "answer": 84, "classif": 84, "omg": 84, "toolbox": 84, "electron": 84, "musculoskelet": 84, "opensim": 84, "physiolog": 84, "competit": 84, "nip": 84, "2017": 84, "foss": 84, "interoper": 84, "quantum": 84, "circuit": 84, "wire": 84, "qubit": 84, "googl": 84, "quantumai": 84, "cirq": 84, "quadrotor": 84, "casadi": 84, "symbol": 84, "priori": 84, "constraint": 84, "taobao": 84, "largest": 84, "commerc": 84, "morl": 84, "equiti": 84, "market": 84, "acm": 84, "icaif21": 84, "public": 84, "financi": 84, "daili": 84, "investor": 84, "respons": 84, "experiment": 84, "theorem": 84, "prover": 84, "vampir": 84, "theoret": 84, "workshop": 84, "f1tenth": 84, "unoffici": 84, "baselines3": 84, "trackmania": 84, "2020": 84, "latent": 84, "miniatur": 84, "racecar": 84, "portabl": 84, "evolut": 84, "torc": 84, "wireless": 84, "elastica": 84, "assembli": 84, "slender": 84, "cosserat": 84, "rod": 84, "supertuxkart": 84, "accompani": 84, "ostrich": 84, "bio": 84, "mechan": 84, "locomot": 84, "leg": 84, "co": 84, "soft": 84, "neurip": 84, "snake": 84, "propuls": 84, "music": 84, "dual": 84, "dexter": 84, "hand": 84, "manipul": 84, "isaac": 84, "omnivers": 84, "rust": 84, "jax": 84, "henc": 85, "suitabl": 85, "capabl": 86, "casino": 87, "card": 87, "infam": 87, "beatabl": 87, "infinit": [87, 89], "deck": 87, "won": 87, "viabl": 87, "strategi": 87, "greater": 87, "dealer": 87, "approach": [87, 88], "favorit": 87, "solut": 87, "author": 87, "zemann": 87, "mit": 87, "defaultdict": 87, "seaborn": 87, "sn": 87, "pyplot": 87, "plt": 87, "patch": 87, "barto": 87, "sab": 87, "later": 87, "synonym": 87, "usabl": 87, "ac": 87, "bust": 87, "next_stat": 87, "explanatori": 87, "tell": [87, 89], "watch": 87, "idea": [87, 89], "behav": 87, "slow": 87, "showcas": 87, "ons": 87, "respond": 87, "harm": 87, "expor": 87, "percentag": 87, "blackjackag": 87, "lr": 87, "epsilon_decai": 87, "q_valu": 87, "get_act": 87, "greedili": 87, "exploit": 87, "els": [87, 88], "argmax": 87, "old_q_valu": 87, "max_future_q": 87, "decay_epsilon": 87, "readi": 87, "learning_r": 87, "start_epsilon": 87, "n_episod": 87, "200_000": 87, "create_grid": 87, "usable_ac": 87, "action_valu": 87, "meshgrid": 87, "arang": 87, "apply_along_axi": 87, "arr": 87, "dstack": 87, "value_grid": 87, "policy_grid": 87, "create_plot": 87, "figur": 87, "subplot": 87, "fig": 87, "figsiz": 87, "figaspect": 87, "suptitl": 87, "fontsiz": 87, "ax1": 87, "add_subplot": 87, "plot_surfac": 87, "rstride": 87, "cstride": 87, "cmap": 87, "viridi": 87, "edgecolor": 87, "xtick": 87, "ytick": 87, "set_titl": 87, "set_xlabel": 87, "set_ylabel": 87, "zaxi": 87, "set_rotate_label": 87, "set_zlabel": 87, "rotat": 87, "view_init": 87, "220": 87, "ax2": 87, "heatmap": 87, "linewidth": 87, "accent_r": 87, "cbar": 87, "set_xticklabel": 87, "set_yticklabel": 87, "legend": 87, "legend_el": 87, "facecolor": 87, "lightgreen": 87, "grei": 87, "bbox_to_anchor": 87, "fig1": 87, "With": 87, "fig2": 87, "hopefulli": 87, "grip": 87, "mont": 87, "carlo": 87, "book": 87, "fun": 87, "blackjack_tutori": 87, "jupyt": [87, 88, 89], "ipynb": [87, 88, 89], "overview": 88, "relev": 88, "git": 88, "venv": 88, "bin": 88, "concern": 88, "readm": 88, "setup": 88, "gym_exampl": 88, "grid_world": 88, "relative_posit": 88, "reacher_weighted_reward": 88, "discrete_act": 88, "clip_reward": 88, "illustr": [88, 89], "simplist": 88, "gridworldenv": 88, "movement": 88, "piec": 88, "abstract": 88, "window_s": 88, "512": 88, "encod": 88, "walk": 88, "_action_to_direct": 88, "assert": 88, "clock": 88, "_get_ob": 88, "translat": 88, "mandatori": 88, "_agent_loc": 88, "_target_loc": 88, "manhattan": 88, "_get_info": 88, "oftentim": 88, "worri": 88, "coincid": 88, "earlier": 88, "array_equ": 88, "_render_fram": 88, "trivial": 88, "skeleton": 88, "init": 88, "set_mod": 88, "canva": 88, "pix_square_s": 88, "rect": 88, "gridlin": 88, "width": 88, "visibl": 88, "blit": 88, "get_rect": 88, "pump": 88, "delai": 88, "stabl": 88, "tick": 88, "surfarrai": 88, "pixels3d": 88, "bother": 88, "detect": 88, "put": 88, "registr": 88, "appropri": 88, "entrypoint": 88, "mere": 88, "explicitli": [88, 89], "third": 88, "parti": 88, "codebas": 88, "edit": 88, "setuptool": 88, "install_requir": 88, "local": 88, "perfectli": 88, "fine": 88, "variant": 88, "did": 89, "failur": 89, "notabl": 89, "inher": 89, "preserv": 89, "obviou": 89, "forev": 89, "forcibli": 89, "halt": 89, "estim": 89, "formal": 89, "q_": 89, "o_t": 89, "a_t": 89, "r_t": 89, "max_a": 89, "o_": 89, "a_": 89, "q_target": 89, "distinct": 89, "frequent": 89, "differenti": 89, "vf_target": 89, "vf_next_stat": 89, "onward": 89, "handling_time_limit": 89}, "objects": {"Space": [[4, 0, 1, "", "dtype"]], "": [[10, 1, 1, "", "action_space"], [10, 1, 1, "", "observation_space"], [10, 1, 1, "", "single_action_space"], [10, 1, 1, "", "single_observation_space"]], "gymnasium": [[12, 2, 1, "", "ActionWrapper"], [2, 2, 1, "", "Env"], [14, 2, 1, "", "ObservationWrapper"], [15, 2, 1, "", "RewardWrapper"], [11, 2, 1, "", "Wrapper"], [3, 3, 1, "", "make"], [3, 3, 1, "", "register"], [3, 3, 1, "", "spec"]], "gymnasium.ActionWrapper.ActionWrapper": [[12, 3, 1, "", "action"]], "gymnasium.Env": [[2, 1, 1, "", "action_space"], [2, 3, 1, "", "close"], [2, 1, 1, "", "metadata"], [2, 0, 1, "", "np_random"], [2, 1, 1, "", "observation_space"], [2, 3, 1, "", "render"], [2, 1, 1, "", "render_mode"], [2, 3, 1, "", "reset"], [2, 1, 1, "", "reward_range"], [2, 1, 1, "", "spec"], [2, 3, 1, "", "step"], [2, 0, 1, "", "unwrapped"]], "gymnasium.ObservationWrapper": [[14, 3, 1, "", "observation"]], "gymnasium.RewardWrapper.RewardWrapper": [[15, 3, 1, "", "reward"]], "gymnasium.Wrapper": [[11, 0, 1, "", "action_space"], [11, 3, 1, "", "close"], [11, 0, 1, "", "metadata"], [11, 0, 1, "", "np_random"], [11, 0, 1, "", "observation_space"], [11, 3, 1, "", "reset"], [11, 0, 1, "", "reward_range"], [11, 0, 1, "", "spec"], [11, 3, 1, "", "step"], [11, 0, 1, "", "unwrapped"]], "gymnasium.spaces": [[6, 2, 1, "", "Box"], [5, 2, 1, "", "Dict"], [6, 2, 1, "", "Discrete"], [5, 2, 1, "", "Graph"], [6, 2, 1, "", "MultiBinary"], [6, 2, 1, "", "MultiDiscrete"], [5, 2, 1, "", "Sequence"], [4, 2, 1, "", "Space"], [6, 2, 1, "", "Text"], [5, 2, 1, "", "Tuple"]], "gymnasium.spaces.Box": [[6, 4, 1, "", "is_bounded"], [6, 4, 1, "", "sample"], [6, 4, 1, "", "seed"]], "gymnasium.spaces.Dict": [[5, 4, 1, "", "sample"], [5, 4, 1, "", "seed"]], "gymnasium.spaces.Discrete": [[6, 4, 1, "", "sample"], [6, 4, 1, "", "seed"]], "gymnasium.spaces.Graph": [[5, 4, 1, "", "sample"], [5, 4, 1, "", "seed"]], "gymnasium.spaces.MultiBinary": [[6, 4, 1, "", "sample"], [6, 4, 1, "", "seed"]], "gymnasium.spaces.MultiDiscrete": [[6, 4, 1, "", "sample"], [6, 4, 1, "", "seed"]], "gymnasium.spaces.Sequence": [[5, 4, 1, "", "sample"], [5, 4, 1, "", "seed"]], "gymnasium.spaces.Text": [[6, 4, 1, "", "sample"], [6, 4, 1, "", "seed"]], "gymnasium.spaces.Tuple": [[5, 4, 1, "", "sample"], [5, 4, 1, "", "seed"]], "gymnasium.spaces.space.Space": [[4, 3, 1, "", "contains"], [4, 3, 1, "", "from_jsonable"], [4, 3, 1, "", "sample"], [4, 3, 1, "", "seed"], [4, 0, 1, "", "shape"], [4, 3, 1, "", "to_jsonable"]], "gymnasium.spaces.utils": [[7, 3, 1, "", "flatdim"], [7, 3, 1, "", "flatten"], [7, 3, 1, "", "flatten_space"], [7, 3, 1, "", "unflatten"]], "gymnasium.utils.env_checker": [[9, 3, 1, "", "check_env"]], "gymnasium.utils.play": [[9, 2, 1, "", "PlayPlot"], [9, 2, 1, "", "PlayableGame"], [9, 3, 1, "", "play"]], "gymnasium.utils.play.PlayPlot": [[9, 4, 1, "", "callback"]], "gymnasium.utils.play.PlayableGame": [[9, 4, 1, "", "process_event"]], "gymnasium.utils.save_video": [[9, 3, 1, "", "capped_cubic_video_schedule"], [9, 3, 1, "", "save_video"]], "gymnasium.utils.seeding": [[9, 3, 1, "", "np_random"]], "gymnasium.utils.step_api_compatibility": [[9, 3, 1, "", "convert_to_done_step_api"], [9, 3, 1, "", "convert_to_terminated_truncated_step_api"], [9, 3, 1, "", "step_api_compatibility"]], "gymnasium.vector": [[10, 2, 1, "", "AsyncVectorEnv"], [10, 2, 1, "", "SyncVectorEnv"], [10, 2, 1, "", "VectorEnv"], [10, 3, 1, "", "make"]], "gymnasium.vector.VectorEnv": [[10, 4, 1, "", "close"], [10, 4, 1, "", "reset"], [10, 4, 1, "", "step"]], "gymnasium.vector.utils": [[8, 3, 1, "", "batch_space"], [8, 3, 1, "", "concatenate"], [8, 3, 1, "", "create_empty_array"], [8, 3, 1, "", "create_shared_memory"], [8, 3, 1, "", "iterate"], [8, 3, 1, "", "read_from_shared_memory"], [8, 3, 1, "", "write_to_shared_memory"]], "gymnasium.wrappers": [[13, 2, 1, "", "AtariPreprocessing"], [13, 2, 1, "", "AutoResetWrapper"], [12, 2, 1, "", "ClipAction"], [13, 2, 1, "", "EnvCompatibility"], [14, 2, 1, "", "FilterObservation"], [14, 2, 1, "", "FlattenObservation"], [14, 2, 1, "", "FrameStack"], [14, 2, 1, "", "GrayScaleObservation"], [13, 2, 1, "", "HumanRendering"], [14, 2, 1, "", "NormalizeObservation"], [15, 2, 1, "", "NormalizeReward"], [13, 2, 1, "", "OrderEnforcing"], [13, 2, 1, "", "PassiveEnvChecker"], [14, 2, 1, "", "PixelObservationWrapper"], [13, 2, 1, "", "RecordEpisodeStatistics"], [13, 2, 1, "", "RecordVideo"], [13, 2, 1, "", "RenderCollection"], [12, 2, 1, "", "RescaleAction"], [14, 2, 1, "", "ResizeObservation"], [13, 2, 1, "", "StepAPICompatibility"], [14, 2, 1, "", "TimeAwareObservation"], [13, 2, 1, "", "TimeLimit"], [14, 2, 1, "", "TransformObservation"], [15, 2, 1, "", "TransformReward"], [13, 2, 1, "", "VectorListInfo"]]}, "objtypes": {"0": "py:property", "1": "py:attribute", "2": "py:class", "3": "py:function", "4": "py:method"}, "objnames": {"0": ["py", "property", "Python property"], "1": ["py", "attribute", "Python attribute"], "2": ["py", "class", "Python class"], "3": ["py", "function", "Python function"], "4": ["py", "method", "Python method"]}, "titleterms": {"404": 0, "page": [0, 1], "Not": 0, "found": 0, "The": [0, 84], "request": 0, "could": 0, "gymnasium": [1, 2, 10, 11, 86, 88], "doc": 1, "instruct": 1, "modifi": [1, 16], "environ": [1, 2, 3, 9, 10, 13, 16, 17, 18, 84, 86, 87, 88], "edit": 1, "an": [1, 87], "ad": 1, "new": [1, 9], "atari": [1, 13, 19], "env": [1, 2, 10, 84, 88], "non": 1, "other": [1, 84], "step": [1, 9, 17, 18], "build": [1, 87], "document": 1, "write": 1, "tutori": 1, "method": [2, 4, 10, 11], "attribut": [2, 4, 10, 11], "addit": 2, "implement": [2, 11], "registri": 3, "make": [3, 10, 88], "regist": [3, 88], "all": 3, "spec": 3, "space": [4, 5, 6, 7, 8, 16, 19, 44, 45, 46, 47, 48], "fundament": [4, 6], "composit": [4, 5], "util": [4, 7, 8, 9], "vector": [4, 8, 10, 13], "dict": 5, "tupl": 5, "sequenc": 5, "graph": 5, "box": [6, 33], "discret": 6, "multibinari": 6, "multidiscret": 6, "text": [6, 85], "share": 8, "memori": 8, "visual": [9, 87], "save": 9, "render": [9, 13, 18], "video": [9, 13, 78, 84], "old": 9, "api": [9, 17, 86], "compat": [9, 13, 17], "seed": [9, 18], "check": 9, "vectorenv": 10, "async": 10, "sync": 10, "wrapper": [11, 12, 13, 14, 15, 88], "custom": [11, 88], "action": [12, 16, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 87], "clip": 12, "rescal": 12, "misc": 13, "preprocess": 13, "autoreset": 13, "passiv": 13, "checker": 13, "human": 13, "order": 13, "enforc": 13, "record": 13, "episod": 13, "statist": 13, "collect": [13, 86], "time": [13, 14, 89], "limit": [13, 89], "list": 13, "info": 13, "observ": [14, 16, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 87], "transform": [14, 15], "filter": 14, "flatten": 14, "framestack": 14, "grai": 14, "scale": 14, "normal": [14, 15], "pixel": 14, "resiz": 14, "awar": 14, "reward": [15, 19, 22, 23, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74], "basic": 16, "usag": 16, "initi": [16, 88], "interact": 16, "explain": 16, "code": [16, 18, 89], "more": 16, "inform": 16, "gym": [17, 84], "load": 17, "openai": [17, 84], "v0": 17, "22": 17, "v21": 18, "v26": 18, "migrat": 18, "guid": 18, "exampl": 18, "random": 18, "number": 18, "gener": 18, "reset": 18, "remov": 18, "autorom": 19, "instal": 19, "rom": 19, "stochast": 19, "common": 19, "argument": [19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80], "version": [19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80], "histori": [19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80], "name": [19, 58], "scheme": 19, "flavor": 19, "refer": [19, 86], "adventur": 20, "descript": [20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80], "air": 21, "raid": 21, "alien": 22, "amidar": 23, "assault": 24, "asterix": 25, "asteroid": 26, "atlanti": 27, "bank": 28, "heist": 28, "battl": 29, "zone": 29, "beam": 30, "rider": 30, "berzerk": 31, "bowl": 32, "breakout": 34, "carniv": 35, "centiped": 36, "chopper": 37, "command": 37, "crazi": 38, "climber": 38, "defend": 39, "demon": 40, "attack": 40, "doubl": 41, "dunk": 41, "elev": 42, "enduro": 43, "fishingderbi": 44, "freewai": 45, "frostbit": 46, "gopher": 47, "gravitar": 48, "hero": 49, "icehockei": 50, "jamesbond": 51, "journeyescap": 52, "kangaroo": 53, "krull": 54, "kung": 55, "fu": 55, "master": 55, "montezuma": 56, "reveng": 56, "m": 57, "pacman": 57, "thi": 58, "game": [58, 84], "phoenix": 59, "pitfal": 60, "pong": 61, "pooyan": 62, "privateey": 63, "qbert": 64, "riverraid": 65, "road": 66, "runner": 66, "robot": [67, 84], "tank": 67, "seaquest": 68, "ski": 69, "solari": 70, "spaceinvad": 71, "stargunn": 72, "tenni": 73, "timepilot": 74, "tutankham": 75, "up": 76, "n": 76, "down": 76, "ventur": 77, "pinbal": 78, "wizard": 79, "wor": 79, "zaxxon": 80, "box2d": 81, "classic": [82, 84], "control": [82, 84], "mujoco": 83, "third": 84, "parti": 84, "vizdoom": 84, "flappi": 84, "bird": 84, "A": 84, "derk": 84, "gpu": 84, "acceler": 84, "moba": 84, "minerl": 84, "procgen": 84, "slimevolleygym": 84, "simpl": 84, "singl": 84, "multi": 84, "agent": [84, 87], "reinforc": [84, 86], "learn": [84, 86, 87, 89], "stabl": 84, "retro": 84, "uniti": 84, "ml": 84, "board": 84, "card": 84, "etc": 84, "abalon": 84, "two": 84, "player": 84, "abstract": 84, "strategi": 84, "spoof": 84, "xiangqi": 84, "chines": 84, "chess": 84, "rubikscubegym": 84, "gymgo": 84, "gymfc": 84, "flight": 84, "tune": 84, "train": 84, "framework": 84, "gazebo": 84, "goddard": 84, "": 84, "rocket": 84, "problem": 84, "jimini": 84, "miniworld": 84, "pybullet": 84, "drone": 84, "marsexplor": 84, "panda": 84, "robo": 84, "offworld": 84, "autonom": 84, "drive": 84, "traffic": 84, "carla": 84, "duckietown": 84, "electr": 84, "motor": 84, "highwai": 84, "longicontrol": 84, "sumo": 84, "rl": 84, "commonroad": 84, "pettingzoo": 84, "anomalous_rl_env": 84, "carl": 84, "compilergym": 84, "dacbench": 84, "gridworld": 84, "adserv": 84, "algorithm": 84, "anytrad": 84, "autokei": 84, "ccc": 84, "cellular": 84, "automata": 84, "inventori": 84, "maze": 84, "mtsim": 84, "legaci": 84, "toytext": 84, "riverswim": 84, "recsi": 84, "sokoban": 84, "math": 84, "prog": 84, "synth": 84, "nasgym": 84, "nlpgym": 84, "toolkit": 84, "develop": 84, "solv": [84, 87], "nlp": 84, "task": 84, "obstacl": 84, "tower": 84, "openmodelica": 84, "microgrid": 84, "osim": 84, "pge": 84, "parallel": 84, "engin": 84, "qasgym": 84, "safe": 84, "virtualtaobao": 84, "mo": 84, "abid": 84, "satur": 84, "shinrl": 84, "race": 84, "go": 84, "explor": 84, "tmrl": 84, "racing_dream": 84, "racecar_gym": 84, "evogym": 84, "design": 84, "tool": 84, "l2r": 84, "gym_torc": 84, "mobil": 84, "softrobot": 84, "pyelastica": 84, "tuxkart": 84, "ai": 84, "ostrichrl": 84, "quadrup": 84, "pogo": 84, "stick": 84, "jump": 84, "igibson": 84, "snakerl": 84, "starship": 84, "land": 84, "raveforc": 84, "line": 84, "follow": 84, "dexteroushand": 84, "omniisaacgymenv": 84, "border": 84, "spacerobotenv": 84, "gymnax": 84, "toi": 85, "i": 86, "standard": 86, "divers": 86, "blackjack": 87, "q": 87, "import": [87, 89], "setup": 87, "execut": 87, "result": 87, "your": 88, "own": 88, "subclass": 88, "declar": 88, "creat": 88, "packag": 88, "instanc": 88, "us": 88, "handl": 89, "termin": 89, "truncat": 89, "solut": 89}, "envversion": {"sphinx.domains.c": 2, "sphinx.domains.changeset": 1, "sphinx.domains.citation": 1, "sphinx.domains.cpp": 8, "sphinx.domains.index": 1, "sphinx.domains.javascript": 2, "sphinx.domains.math": 2, "sphinx.domains.python": 3, "sphinx.domains.rst": 2, "sphinx.domains.std": 2, "sphinx": 57}, "alltitles": {"404 - Page Not Found": [[0, "page-not-found"]], "The requested page could not be found.": [[0, "the-requested-page-could-not-be-found"]], "Gymnasium-docs": [[1, "gymnasium-docs"]], "Instructions for modifying environment pages": [[1, "instructions-for-modifying-environment-pages"]], "Editing an environment page": [[1, "editing-an-environment-page"]], "Adding a new environment": [[1, "adding-a-new-environment"]], "Atari env": [[1, "atari-env"]], "Non-Atari env": [[1, "non-atari-env"]], "Other steps": [[1, "other-steps"]], "Build the Documentation": [[1, "build-the-documentation"]], "Writing Tutorials": [[1, "writing-tutorials"]], "Env": [[2, "env"]], "gymnasium.Env": [[2, "gymnasium-env"]], "Methods": [[2, "methods"], [4, "methods"], [10, "methods"], [11, "methods"]], "Attributes": [[2, "attributes"], [4, "attributes"], [10, "attributes"], [11, "attributes"]], "Additional Methods": [[2, "additional-methods"]], "Implementing environments": [[2, "implementing-environments"]], "Registry": [[3, "registry"]], "Make": [[3, "make"]], "Register": [[3, "register"]], "All registered environments": [[3, "all-registered-environments"]], "Spec": [[3, "spec"]], "Spaces": [[4, "spaces"]], "Fundamental Spaces": [[4, "fundamental-spaces"], [6, "fundamental-spaces"]], "Composite Spaces": [[4, "composite-spaces"], [5, "composite-spaces"]], "Utils": [[4, "utils"], [9, "utils"]], "Vector Utils": [[4, "vector-utils"]], "Dict": [[5, "dict"]], "Tuple": [[5, "tuple"]], "Sequence": [[5, "sequence"]], "Graph": [[5, "graph"]], "Box": [[6, "box"]], "Discrete": [[6, "discrete"]], "MultiBinary": [[6, "multibinary"]], "MultiDiscrete": [[6, "multidiscrete"]], "Text": [[6, "text"]], "Spaces Utils": [[7, "spaces-utils"]], "Spaces Vector Utils": [[8, "spaces-vector-utils"]], "Shared Memory Utils": [[8, "shared-memory-utils"]], "Visualization": [[9, "visualization"]], "Save Rendering Videos": [[9, "save-rendering-videos"]], "Old to New Step API Compatibility": [[9, "old-to-new-step-api-compatibility"]], "Seeding": [[9, "seeding"]], "Environment Checking": [[9, "environment-checking"]], "Vector": [[10, "vector"]], "Gymnasium.vector.VectorEnv": [[10, "gymnasium-vector-vectorenv"]], "Making Vector Environments": [[10, "making-vector-environments"]], "Async Vector Env": [[10, "async-vector-env"]], "Sync Vector Env": [[10, "sync-vector-env"]], "Wrappers": [[11, "wrappers"]], "gymnasium.Wrapper": [[11, "gymnasium-wrapper"]], "Gymnasium Wrappers": [[11, "gymnasium-wrappers"]], "Implementing a custom wrapper": [[11, "implementing-a-custom-wrapper"]], "Action Wrappers": [[12, "action-wrappers"]], "Action Wrapper": [[12, "action-wrapper"]], "Clip Action": [[12, "clip-action"]], "Rescale Action": [[12, "rescale-action"]], "Misc Wrappers": [[13, "misc-wrappers"]], "Atari Preprocessing": [[13, "atari-preprocessing"]], "Autoreset": [[13, "autoreset"]], "Compatibility": [[13, "compatibility"]], "Passive Environment Checker": [[13, "passive-environment-checker"]], "Human Rendering": [[13, "human-rendering"]], "Order Enforcing": [[13, "order-enforcing"]], "Record Episode Statistics": [[13, "record-episode-statistics"]], "Record Video": [[13, "record-video"]], "Render Collection": [[13, "render-collection"]], "Time Limit": [[13, "time-limit"]], "Vector List Info": [[13, "vector-list-info"]], "Observation Wrappers": [[14, "observation-wrappers"]], "Observation Wrapper": [[14, "observation-wrapper"]], "Transform Observation": [[14, "transform-observation"]], "Filter Observation": [[14, "filter-observation"]], "Flatten Observation": [[14, "flatten-observation"]], "Framestack Observations": [[14, "framestack-observations"]], "Gray Scale Observation": [[14, "gray-scale-observation"]], "Normalize Observation": [[14, "normalize-observation"]], "Pixel Observation Wrapper": [[14, "pixel-observation-wrapper"]], "Resize Observation": [[14, "resize-observation"]], "Time Aware Observation": [[14, "time-aware-observation"]], "Reward Wrappers": [[15, "reward-wrappers"]], "Reward Wrapper": [[15, "reward-wrapper"]], "Transform Reward": [[15, "transform-reward"]], "Normalize Reward": [[15, "normalize-reward"]], "Basic Usage": [[16, "basic-usage"]], "Initializing Environments": [[16, "initializing-environments"]], "Interacting with the Environment": [[16, "interacting-with-the-environment"]], "Explaining the code": [[16, "explaining-the-code"]], "Action and observation spaces": [[16, "action-and-observation-spaces"]], "Modifying the environment": [[16, "modifying-the-environment"]], "More information": [[16, "more-information"]], "Compatibility with Gym": [[17, "compatibility-with-gym"]], "Loading OpenAI Gym environments": [[17, "loading-openai-gym-environments"]], "Gym v0.22 Environment Compatibility": [[17, "gym-v0-22-environment-compatibility"]], "Step API Compatibility": [[17, "step-api-compatibility"]], "v21 to v26 Migration Guide": [[18, "v21-to-v26-migration-guide"]], "Example code for v21": [[18, "example-code-for-v21"]], "Example code for v26": [[18, "example-code-for-v26"]], "Seed and random number generator": [[18, "seed-and-random-number-generator"]], "Environment Reset": [[18, "environment-reset"]], "Environment Step": [[18, "environment-step"]], "Environment Render": [[18, "environment-render"]], "Removed code": [[18, "removed-code"]], "Atari": [[19, "atari"]], "AutoROM (installing the ROMs)": [[19, "autorom-installing-the-roms"]], "Action Space": [[19, "action-space"], [44, "action-space"], [45, "action-space"], [46, "action-space"], [47, "action-space"], [48, "action-space"]], "Observation Space": [[19, "observation-space"]], "Rewards": [[19, "rewards"], [22, "rewards"], [23, "rewards"], [25, "rewards"], [26, "rewards"], [27, "rewards"], [28, "rewards"], [29, "rewards"], [30, "rewards"], [31, "rewards"], [32, "rewards"], [33, "rewards"], [34, "rewards"], [35, "rewards"], [36, "rewards"], [37, "rewards"], [38, "rewards"], [39, "rewards"], [40, "rewards"], [41, "rewards"], [42, "rewards"], [43, "rewards"], [44, "rewards"], [45, "rewards"], [46, "rewards"], [47, "rewards"], [48, "rewards"], [49, "rewards"], [50, "rewards"], [51, "rewards"], [52, "rewards"], [53, "rewards"], [54, "rewards"], [60, "rewards"], [61, "rewards"], [62, "rewards"], [63, "rewards"], [64, "rewards"], [65, "rewards"], [66, "rewards"], [67, "rewards"], [68, "rewards"], [69, "rewards"], [70, "rewards"], [71, "rewards"], [72, "rewards"], [73, "rewards"], [74, "rewards"]], "Stochasticity": [[19, "stochasticity"]], "Common Arguments": [[19, "common-arguments"]], "Version History and Naming Schemes": [[19, "version-history-and-naming-schemes"]], "Flavors": [[19, "flavors"]], "References": [[19, "references"]], "Adventure": [[20, "adventure"]], "Description": [[20, "description"], [21, "description"], [22, "description"], [23, "description"], [24, "description"], [25, "description"], [26, "description"], [27, "description"], [28, "description"], [29, "description"], [30, "description"], [31, "description"], [32, "description"], [33, "description"], [34, "description"], [35, "description"], [36, "description"], [37, "description"], [38, "description"], [39, "description"], [40, "description"], [41, "description"], [42, "description"], [43, "description"], [44, "description"], [45, "description"], [46, "description"], [47, "description"], [48, "description"], [49, "description"], [50, "description"], [51, "description"], [52, "description"], [53, "description"], [54, "description"], [55, "description"], [56, "description"], [57, "description"], [58, "description"], [59, "description"], [60, "description"], [61, "description"], [62, "description"], [63, "description"], [64, "description"], [65, "description"], [66, "description"], [67, "description"], [68, "description"], [69, "description"], [70, "description"], [71, "description"], [72, "description"], [73, "description"], [74, "description"], [75, "description"], [76, "description"], [77, "description"], [78, "description"], [79, "description"], [80, "description"]], "Actions": [[20, "actions"], [21, "actions"], [22, "actions"], [23, "actions"], [24, "actions"], [25, "actions"], [26, "actions"], [27, "actions"], [28, "actions"], [29, "actions"], [30, "actions"], [31, "actions"], [32, "actions"], [33, "actions"], [34, "actions"], [35, "actions"], [36, "actions"], [37, "actions"], [38, "actions"], [39, "actions"], [40, "actions"], [41, "actions"], [42, "actions"], [43, "actions"], [49, "actions"], [50, "actions"], [51, "actions"], [52, "actions"], [53, "actions"], [54, "actions"], [55, "actions"], [56, "actions"], [57, "actions"], [58, "actions"], [59, "actions"], [60, "actions"], [61, "actions"], [62, "actions"], [63, "actions"], [64, "actions"], [65, "actions"], [66, "actions"], [67, "actions"], [68, "actions"], [69, "actions"], [70, "actions"], [71, "actions"], [72, "actions"], [73, "actions"], [74, "actions"], [75, "actions"], [76, "actions"], [77, "actions"], [78, "actions"], [79, "actions"], [80, "actions"]], "Observations": [[20, "observations"], [21, "observations"], [22, "observations"], [23, "observations"], [24, "observations"], [25, "observations"], [26, "observations"], [27, "observations"], [28, "observations"], [29, "observations"], [30, "observations"], [31, "observations"], [32, "observations"], [33, "observations"], [34, "observations"], [35, "observations"], [36, "observations"], [37, "observations"], [38, "observations"], [39, "observations"], [40, "observations"], [41, "observations"], [42, "observations"], [43, "observations"], [44, "observations"], [45, "observations"], [46, "observations"], [47, "observations"], [48, "observations"], [49, "observations"], [50, "observations"], [51, "observations"], [52, "observations"], [53, "observations"], [54, "observations"], [55, "observations"], [56, "observations"], [57, "observations"], [58, "observations"], [59, "observations"], [60, "observations"], [61, "observations"], [62, "observations"], [63, "observations"], [64, "observations"], [65, "observations"], [66, "observations"], [67, "observations"], [68, "observations"], [69, "observations"], [70, "observations"], [71, "observations"], [72, "observations"], [73, "observations"], [74, "observations"], [75, "observations"], [76, "observations"], [77, "observations"], [78, "observations"], [79, "observations"], [80, "observations"]], "Arguments": [[20, "arguments"], [21, "arguments"], [22, "arguments"], [23, "arguments"], [24, "arguments"], [25, "arguments"], [26, "arguments"], [27, "arguments"], [28, "arguments"], [29, "arguments"], [30, "arguments"], [31, "arguments"], [32, "arguments"], [33, "arguments"], [34, "arguments"], [35, "arguments"], [36, "arguments"], [37, "arguments"], [38, "arguments"], [39, "arguments"], [40, "arguments"], [41, "arguments"], [42, "arguments"], [43, "arguments"], [44, "arguments"], [45, "arguments"], [46, "arguments"], [47, "arguments"], [48, "arguments"], [49, "arguments"], [50, "arguments"], [51, "arguments"], [52, "arguments"], [53, "arguments"], [54, "arguments"], [55, "arguments"], [56, "arguments"], [57, "arguments"], [58, "arguments"], [59, "arguments"], [60, "arguments"], [61, "arguments"], [62, "arguments"], [63, "arguments"], [64, "arguments"], [65, "arguments"], [66, "arguments"], [67, "arguments"], [68, "arguments"], [69, "arguments"], [70, "arguments"], [71, "arguments"], [72, "arguments"], [73, "arguments"], [74, "arguments"], [75, "arguments"], [76, "arguments"], [77, "arguments"], [78, "arguments"], [79, "arguments"], [80, "arguments"]], "Version History": [[20, "version-history"], [21, "version-history"], [22, "version-history"], [23, "version-history"], [24, "version-history"], [25, "version-history"], [26, "version-history"], [27, "version-history"], [28, "version-history"], [29, "version-history"], [30, "version-history"], [31, "version-history"], [32, "version-history"], [33, "version-history"], [34, "version-history"], [35, "version-history"], [36, "version-history"], [37, "version-history"], [38, "version-history"], [39, "version-history"], [40, "version-history"], [41, "version-history"], [42, "version-history"], [43, "version-history"], [44, "version-history"], [45, "version-history"], [46, "version-history"], [47, "version-history"], [48, "version-history"], [49, "version-history"], [50, "version-history"], [51, "version-history"], [52, "version-history"], [53, "version-history"], [54, "version-history"], [55, "version-history"], [56, "version-history"], [57, "version-history"], [58, "version-history"], [59, "version-history"], [60, "version-history"], [61, "version-history"], [62, "version-history"], [63, "version-history"], [64, "version-history"], [65, "version-history"], [66, "version-history"], [67, "version-history"], [68, "version-history"], [69, "version-history"], [70, "version-history"], [71, "version-history"], [72, "version-history"], [73, "version-history"], [74, "version-history"], [75, "version-history"], [76, "version-history"], [77, "version-history"], [78, "version-history"], [79, "version-history"], [80, "version-history"]], "Air Raid": [[21, "air-raid"]], "Alien": [[22, "alien"]], "Amidar": [[23, "amidar"]], "Assault": [[24, "assault"]], "Asterix": [[25, "asterix"]], "Asteroids": [[26, "asteroids"]], "Atlantis": [[27, "atlantis"]], "Bank Heist": [[28, "bank-heist"]], "Battle Zone": [[29, "battle-zone"]], "Beam Rider": [[30, "beam-rider"]], "Berzerk": [[31, "berzerk"]], "Bowling": [[32, "bowling"]], "Boxing": [[33, "boxing"]], "Breakout": [[34, "breakout"]], "Carnival": [[35, "carnival"]], "Centipede": [[36, "centipede"]], "Chopper Command": [[37, "chopper-command"]], "Crazy Climber": [[38, "crazy-climber"]], "Defender": [[39, "defender"]], "Demon Attack": [[40, "demon-attack"]], "Double Dunk": [[41, "double-dunk"]], "Elevator Action": [[42, "elevator-action"]], "Enduro": [[43, "enduro"]], "FishingDerby": [[44, "fishingderby"]], "Freeway": [[45, "freeway"]], "Frostbite": [[46, "frostbite"]], "Gopher": [[47, "gopher"]], "Gravitar": [[48, "gravitar"]], "Hero": [[49, "hero"]], "IceHockey": [[50, "icehockey"]], "Jamesbond": [[51, "jamesbond"]], "JourneyEscape": [[52, "journeyescape"]], "Kangaroo": [[53, "kangaroo"]], "Krull": [[54, "krull"]], "Kung Fu Master": [[55, "kung-fu-master"]], "Montezuma Revenge": [[56, "montezuma-revenge"]], "Ms Pacman": [[57, "ms-pacman"]], "Name This Game": [[58, "name-this-game"]], "Phoenix": [[59, "phoenix"]], "Pitfall": [[60, "pitfall"]], "Pong": [[61, "pong"]], "Pooyan": [[62, "pooyan"]], "PrivateEye": [[63, "privateeye"]], "Qbert": [[64, "qbert"]], "Riverraid": [[65, "riverraid"]], "Road Runner": [[66, "road-runner"]], "Robot Tank": [[67, "robot-tank"]], "Seaquest": [[68, "seaquest"]], "Skiings": [[69, "skiings"]], "Solaris": [[70, "solaris"]], "SpaceInvaders": [[71, "spaceinvaders"]], "StarGunner": [[72, "stargunner"]], "Tennis": [[73, "tennis"]], "TimePilot": [[74, "timepilot"]], "Tutankham": [[75, "tutankham"]], "Up n\u2019 Down": [[76, "up-n-down"]], "Venture": [[77, "venture"]], "Video Pinball": [[78, "video-pinball"]], "Wizard of Wor": [[79, "wizard-of-wor"]], "Zaxxon": [[80, "zaxxon"]], "Box2D": [[81, "box2d"]], "Classic Control": [[82, "classic-control"]], "MuJoCo": [[83, "mujoco"]], "Third-Party Environments": [[84, "third-party-environments"]], "Video Game Environments": [[84, "video-game-environments"]], "ViZDoom": [[84, "vizdoom"]], " flappy-bird-gym: A Flappy Bird environment for OpenAI Gym": [[84, "flappy-bird-gym-a-flappy-bird-environment-for-openai-gym"]], " gym-derk: GPU accelerated MOBA environment": [[84, "gym-derk-gpu-accelerated-moba-environment"]], " MineRL": [[84, "minerl"]], " Procgen": [[84, "procgen"]], " SlimeVolleyGym: A simple environment for single and multi-agent reinforcement learning": [[84, "slimevolleygym-a-simple-environment-for-single-and-multi-agent-reinforcement-learning"]], " stable-retro": [[84, "stable-retro"]], " Unity ML Agents": [[84, "unity-ml-agents"]], "Classic Environments (board, card, etc. games)": [[84, "classic-environments-board-card-etc-games"]], " gym-abalone: A two-player abstract strategy board game": [[84, "gym-abalone-a-two-player-abstract-strategy-board-game"]], " gym-spoof": [[84, "gym-spoof"]], " gym-xiangqi: Xiangqi - The Chinese Chess Game": [[84, "gym-xiangqi-xiangqi-the-chinese-chess-game"]], " RubiksCubeGym": [[84, "rubikscubegym"]], " GymGo": [[84, "gymgo"]], "Robotics Environments": [[84, "robotics-environments"]], " GymFC: A flight control tuning and training framework": [[84, "gymfc-a-flight-control-tuning-and-training-framework"]], " gym-gazebo": [[84, "gym-gazebo"]], " gym-goddard: Goddard\u2019s Rocket Problem": [[84, "gym-goddard-goddard-s-rocket-problem"]], " gym-jiminy: training Robots in Jiminy": [[84, "gym-jiminy-training-robots-in-jiminy"]], " gym-miniworld": [[84, "gym-miniworld"]], " gym-pybullet-drones": [[84, "gym-pybullet-drones"]], " MarsExplorer": [[84, "marsexplorer"]], " panda-gym ": [[84, "panda-gym"]], " PyBullet Robotics Environments": [[84, "pybullet-robotics-environments"]], " robo-gym": [[84, "robo-gym"]], " Offworld-gym": [[84, "offworld-gym"]], "Autonomous Driving and Traffic Control Environments": [[84, "autonomous-driving-and-traffic-control-environments"]], " gym-carla": [[84, "gym-carla"]], " gym-duckietown": [[84, "gym-duckietown"]], " gym-electric-motor": [[84, "gym-electric-motor"]], " highway-env": [[84, "highway-env"]], " LongiControl": [[84, "longicontrol"]], " sumo-rl": [[84, "sumo-rl"]], " CommonRoad-RL": [[84, "commonroad-rl"]], "Multi-Agents": [[84, "multi-agents"]], "PettingZoo": [[84, "pettingzoo"]], "Other Environments": [[84, "other-environments"]], " anomalous_rl_envs": [[84, "anomalous-rl-envs"]], " CARL": [[84, "carl"]], " CompilerGym": [[84, "compilergym"]], " DACBench": [[84, "dacbench"]], " Gridworld": [[84, "gridworld"]], " gym-adserve": [[84, "gym-adserve"]], " gym-algorithmic": [[84, "gym-algorithmic"]], " gym-anytrading": [[84, "gym-anytrading"]], " gym-autokey": [[84, "gym-autokey"]], " gym-ccc": [[84, "gym-ccc"]], " gym-cellular-automata": [[84, "gym-cellular-automata"]], " gym-games": [[84, "gym-games"]], " gym-inventory": [[84, "gym-inventory"]], " gym-maze": [[84, "gym-maze"]], " gym-mtsim": [[84, "gym-mtsim"]], " gym-legacy-toytext": [[84, "gym-legacy-toytext"]], " gym-riverswim": [[84, "gym-riverswim"]], " gym-recsys": [[84, "gym-recsys"]], " gym-sokoban": [[84, "gym-sokoban"]], " math-prog-synth-env": [[84, "math-prog-synth-env"]], " NASGym": [[84, "nasgym"]], " NLPGym: A toolkit to develop RL agents to solve NLP tasks": [[84, "nlpgym-a-toolkit-to-develop-rl-agents-to-solve-nlp-tasks"]], " Obstacle Tower": [[84, "obstacle-tower"]], " openmodelica-microgrid-gym": [[84, "openmodelica-microgrid-gym"]], " osim-rl": [[84, "osim-rl"]], " PGE: Parallel Game Engine": [[84, "pge-parallel-game-engine"]], " QASGym": [[84, "qasgym"]], " safe-control-gym": [[84, "safe-control-gym"]], " VirtualTaobao": [[84, "virtualtaobao"]], " mo-gym": [[84, "mo-gym"]], "ABIDES-Gym": [[84, "abides-gym"]], "gym-saturation": [[84, "gym-saturation"]], "ShinRL": [[84, "shinrl"]], "racing-rl": [[84, "racing-rl"]], "go-explore": [[84, "go-explore"]], "tmrl": [[84, "tmrl"]], "racing_dreamer": [[84, "racing-dreamer"]], "racecar_gym": [[84, "racecar-gym"]], "jiminy": [[84, "jiminy"]], "evogym-design-tool": [[84, "evogym-design-tool"]], "l2r": [[84, "l2r"]], "gym_torcs": [[84, "gym-torcs"]], "mobile-env": [[84, "mobile-env"]], "gym-softrobot": [[84, "gym-softrobot"]], "PyElastica": [[84, "pyelastica"]], "tuxkart-ai": [[84, "tuxkart-ai"]], "ostrichrl": [[84, "ostrichrl"]], "quadruped-gym": [[84, "quadruped-gym"]], "Pogo-Stick-Jumping": [[84, "pogo-stick-jumping"]], "evogym": [[84, "evogym"]], "iGibson": [[84, "igibson"]], "SnakeRL": [[84, "snakerl"]], "starship-landing-gym": [[84, "starship-landing-gym"]], "CompilerGym": [[84, "id1"]], "RaveForce": [[84, "raveforce"]], "gym-line-follower": [[84, "gym-line-follower"]], "DexterousHands": [[84, "dexteroushands"]], "OmniIsaacGymEnvs": [[84, "omniisaacgymenvs"]], "border": [[84, "border"]], "SpaceRobotEnv": [[84, "spacerobotenv"]], "gymnax": [[84, "gymnax"]], "Toy Text": [[85, "toy-text"]], "Gymnasium is a standard API for reinforcement learning, and a diverse collection of reference environments": [[86, "gymnasium-is-a-standard-api-for-reinforcement-learning-and-a-diverse-collection-of-reference-environments"]], "Solving Blackjack with Q-Learning": [[87, "solving-blackjack-with-q-learning"]], "Imports and Environment Setup": [[87, "imports-and-environment-setup"]], "Observing the environment": [[87, "observing-the-environment"]], "Executing an action": [[87, "executing-an-action"]], "Building an agent": [[87, "building-an-agent"]], "Visualizing the results": [[87, "visualizing-the-results"]], "Make your own custom environment": [[88, "make-your-own-custom-environment"]], "Subclassing gymnasium.Env": [[88, "subclassing-gymnasium-env"]], "Declaration and Initialization": [[88, "declaration-and-initialization"]], "Registering Envs": [[88, "registering-envs"]], "Creating a Package": [[88, "creating-a-package"]], "Creating Environment Instances": [[88, "creating-environment-instances"]], "Using Wrappers": [[88, "using-wrappers"]], "Handling Time Limits": [[89, "handling-time-limits"]], "Termination": [[89, "termination"]], "Truncation": [[89, "truncation"]], "Importance in learning code": [[89, "importance-in-learning-code"]], "Solution": [[89, "solution"]]}, "indexentries": {"env (class in gymnasium)": [[2, "gymnasium.Env"]], "action_space (gymnasium.env attribute)": [[2, "gymnasium.Env.action_space"]], "close() (in module gymnasium.env)": [[2, "gymnasium.Env.close"]], "metadata (gymnasium.env attribute)": [[2, "gymnasium.Env.metadata"]], "np_random (gymnasium.env property)": [[2, "gymnasium.Env.np_random"]], "observation_space (gymnasium.env attribute)": [[2, "gymnasium.Env.observation_space"]], "render() (in module gymnasium.env)": [[2, "gymnasium.Env.render"]], "render_mode (gymnasium.env attribute)": [[2, "gymnasium.Env.render_mode"]], "reset() (in module gymnasium.env)": [[2, "gymnasium.Env.reset"]], "reward_range (gymnasium.env attribute)": [[2, "gymnasium.Env.reward_range"]], "spec (gymnasium.env attribute)": [[2, "gymnasium.Env.spec"]], "step() (in module gymnasium.env)": [[2, "gymnasium.Env.step"]], "unwrapped (gymnasium.env property)": [[2, "gymnasium.Env.unwrapped"]], "make() (in module gymnasium)": [[3, "gymnasium.make"]], "register() (in module gymnasium)": [[3, "gymnasium.register"]], "spec() (in module gymnasium)": [[3, "gymnasium.spec"]], "space (class in gymnasium.spaces)": [[4, "gymnasium.spaces.Space"]], "contains() (in module gymnasium.spaces.space.space)": [[4, "gymnasium.spaces.space.Space.contains"]], "dtype (space property)": [[4, "Space.dtype"]], "from_jsonable() (in module gymnasium.spaces.space.space)": [[4, "gymnasium.spaces.space.Space.from_jsonable"]], "sample() (in module gymnasium.spaces.space.space)": [[4, "gymnasium.spaces.space.Space.sample"]], "seed() (in module gymnasium.spaces.space.space)": [[4, "gymnasium.spaces.space.Space.seed"]], "shape (gymnasium.spaces.space.space property)": [[4, "gymnasium.spaces.space.Space.shape"]], "to_jsonable() (in module gymnasium.spaces.space.space)": [[4, "gymnasium.spaces.space.Space.to_jsonable"]], "dict (class in gymnasium.spaces)": [[5, "gymnasium.spaces.Dict"]], "graph (class in gymnasium.spaces)": [[5, "gymnasium.spaces.Graph"]], "sequence (class in gymnasium.spaces)": [[5, "gymnasium.spaces.Sequence"]], "tuple (class in gymnasium.spaces)": [[5, "gymnasium.spaces.Tuple"]], "sample() (gymnasium.spaces.dict method)": [[5, "gymnasium.spaces.Dict.sample"]], "sample() (gymnasium.spaces.graph method)": [[5, "gymnasium.spaces.Graph.sample"]], "sample() (gymnasium.spaces.sequence method)": [[5, "gymnasium.spaces.Sequence.sample"]], "sample() (gymnasium.spaces.tuple method)": [[5, "gymnasium.spaces.Tuple.sample"]], "seed() (gymnasium.spaces.dict method)": [[5, "gymnasium.spaces.Dict.seed"]], "seed() (gymnasium.spaces.graph method)": [[5, "gymnasium.spaces.Graph.seed"]], "seed() (gymnasium.spaces.sequence method)": [[5, "gymnasium.spaces.Sequence.seed"]], "seed() (gymnasium.spaces.tuple method)": [[5, "gymnasium.spaces.Tuple.seed"]], "box (class in gymnasium.spaces)": [[6, "gymnasium.spaces.Box"]], "discrete (class in gymnasium.spaces)": [[6, "gymnasium.spaces.Discrete"]], "multibinary (class in gymnasium.spaces)": [[6, "gymnasium.spaces.MultiBinary"]], "multidiscrete (class in gymnasium.spaces)": [[6, "gymnasium.spaces.MultiDiscrete"]], "text (class in gymnasium.spaces)": [[6, "gymnasium.spaces.Text"]], "is_bounded() (gymnasium.spaces.box method)": [[6, "gymnasium.spaces.Box.is_bounded"]], "sample() (gymnasium.spaces.box method)": [[6, "gymnasium.spaces.Box.sample"]], "sample() (gymnasium.spaces.discrete method)": [[6, "gymnasium.spaces.Discrete.sample"]], "sample() (gymnasium.spaces.multibinary method)": [[6, "gymnasium.spaces.MultiBinary.sample"]], "sample() (gymnasium.spaces.multidiscrete method)": [[6, "gymnasium.spaces.MultiDiscrete.sample"]], "sample() (gymnasium.spaces.text method)": [[6, "gymnasium.spaces.Text.sample"]], "seed() (gymnasium.spaces.box method)": [[6, "gymnasium.spaces.Box.seed"]], "seed() (gymnasium.spaces.discrete method)": [[6, "gymnasium.spaces.Discrete.seed"]], "seed() (gymnasium.spaces.multibinary method)": [[6, "gymnasium.spaces.MultiBinary.seed"]], "seed() (gymnasium.spaces.multidiscrete method)": [[6, "gymnasium.spaces.MultiDiscrete.seed"]], "seed() (gymnasium.spaces.text method)": [[6, "gymnasium.spaces.Text.seed"]], "flatdim() (in module gymnasium.spaces.utils)": [[7, "gymnasium.spaces.utils.flatdim"]], "flatten() (in module gymnasium.spaces.utils)": [[7, "gymnasium.spaces.utils.flatten"]], "flatten_space() (in module gymnasium.spaces.utils)": [[7, "gymnasium.spaces.utils.flatten_space"]], "unflatten() (in module gymnasium.spaces.utils)": [[7, "gymnasium.spaces.utils.unflatten"]], "batch_space() (in module gymnasium.vector.utils)": [[8, "gymnasium.vector.utils.batch_space"]], "concatenate() (in module gymnasium.vector.utils)": [[8, "gymnasium.vector.utils.concatenate"]], "create_empty_array() (in module gymnasium.vector.utils)": [[8, "gymnasium.vector.utils.create_empty_array"]], "create_shared_memory() (in module gymnasium.vector.utils)": [[8, "gymnasium.vector.utils.create_shared_memory"]], "iterate() (in module gymnasium.vector.utils)": [[8, "gymnasium.vector.utils.iterate"]], "read_from_shared_memory() (in module gymnasium.vector.utils)": [[8, "gymnasium.vector.utils.read_from_shared_memory"]], "write_to_shared_memory() (in module gymnasium.vector.utils)": [[8, "gymnasium.vector.utils.write_to_shared_memory"]], "playplot (class in gymnasium.utils.play)": [[9, "gymnasium.utils.play.PlayPlot"]], "playablegame (class in gymnasium.utils.play)": [[9, "gymnasium.utils.play.PlayableGame"]], "callback() (gymnasium.utils.play.playplot method)": [[9, "gymnasium.utils.play.PlayPlot.callback"]], "capped_cubic_video_schedule() (in module gymnasium.utils.save_video)": [[9, "gymnasium.utils.save_video.capped_cubic_video_schedule"]], "check_env() (in module gymnasium.utils.env_checker)": [[9, "gymnasium.utils.env_checker.check_env"]], "convert_to_done_step_api() (in module gymnasium.utils.step_api_compatibility)": [[9, "gymnasium.utils.step_api_compatibility.convert_to_done_step_api"]], "convert_to_terminated_truncated_step_api() (in module gymnasium.utils.step_api_compatibility)": [[9, "gymnasium.utils.step_api_compatibility.convert_to_terminated_truncated_step_api"]], "np_random() (in module gymnasium.utils.seeding)": [[9, "gymnasium.utils.seeding.np_random"]], "play() (in module gymnasium.utils.play)": [[9, "gymnasium.utils.play.play"]], "process_event() (gymnasium.utils.play.playablegame method)": [[9, "gymnasium.utils.play.PlayableGame.process_event"]], "save_video() (in module gymnasium.utils.save_video)": [[9, "gymnasium.utils.save_video.save_video"]], "step_api_compatibility() (in module gymnasium.utils.step_api_compatibility)": [[9, "gymnasium.utils.step_api_compatibility.step_api_compatibility"]], "asyncvectorenv (class in gymnasium.vector)": [[10, "gymnasium.vector.AsyncVectorEnv"]], "syncvectorenv (class in gymnasium.vector)": [[10, "gymnasium.vector.SyncVectorEnv"]], "vectorenv (class in gymnasium.vector)": [[10, "gymnasium.vector.VectorEnv"]], "action_space": [[10, "action_space"]], "close() (gymnasium.vector.vectorenv method)": [[10, "gymnasium.vector.VectorEnv.close"]], "make() (in module gymnasium.vector)": [[10, "gymnasium.vector.make"]], "observation_space": [[10, "observation_space"]], "reset() (gymnasium.vector.vectorenv method)": [[10, "gymnasium.vector.VectorEnv.reset"]], "single_action_space": [[10, "single_action_space"]], "single_observation_space": [[10, "single_observation_space"]], "step() (gymnasium.vector.vectorenv method)": [[10, "gymnasium.vector.VectorEnv.step"]], "wrapper (class in gymnasium)": [[11, "gymnasium.Wrapper"]], "action_space (gymnasium.wrapper property)": [[11, "gymnasium.Wrapper.action_space"]], "close() (in module gymnasium.wrapper)": [[11, "gymnasium.Wrapper.close"]], "metadata (gymnasium.wrapper property)": [[11, "gymnasium.Wrapper.metadata"]], "np_random (gymnasium.wrapper property)": [[11, "gymnasium.Wrapper.np_random"]], "observation_space (gymnasium.wrapper property)": [[11, "gymnasium.Wrapper.observation_space"]], "reset() (in module gymnasium.wrapper)": [[11, "gymnasium.Wrapper.reset"]], "reward_range (gymnasium.wrapper property)": [[11, "gymnasium.Wrapper.reward_range"]], "spec (gymnasium.wrapper property)": [[11, "gymnasium.Wrapper.spec"]], "step() (in module gymnasium.wrapper)": [[11, "gymnasium.Wrapper.step"]], "unwrapped (gymnasium.wrapper property)": [[11, "gymnasium.Wrapper.unwrapped"]], "actionwrapper (class in gymnasium)": [[12, "gymnasium.ActionWrapper"]], "actionwrapper.action() (in module gymnasium.actionwrapper)": [[12, "gymnasium.ActionWrapper.ActionWrapper.action"]], "clipaction (class in gymnasium.wrappers)": [[12, "gymnasium.wrappers.ClipAction"]], "rescaleaction (class in gymnasium.wrappers)": [[12, "gymnasium.wrappers.RescaleAction"]], "ataripreprocessing (class in gymnasium.wrappers)": [[13, "gymnasium.wrappers.AtariPreprocessing"]], "autoresetwrapper (class in gymnasium.wrappers)": [[13, "gymnasium.wrappers.AutoResetWrapper"]], "envcompatibility (class in gymnasium.wrappers)": [[13, "gymnasium.wrappers.EnvCompatibility"]], "humanrendering (class in gymnasium.wrappers)": [[13, "gymnasium.wrappers.HumanRendering"]], "orderenforcing (class in gymnasium.wrappers)": [[13, "gymnasium.wrappers.OrderEnforcing"]], "passiveenvchecker (class in gymnasium.wrappers)": [[13, "gymnasium.wrappers.PassiveEnvChecker"]], "recordepisodestatistics (class in gymnasium.wrappers)": [[13, "gymnasium.wrappers.RecordEpisodeStatistics"]], "recordvideo (class in gymnasium.wrappers)": [[13, "gymnasium.wrappers.RecordVideo"]], "rendercollection (class in gymnasium.wrappers)": [[13, "gymnasium.wrappers.RenderCollection"]], "stepapicompatibility (class in gymnasium.wrappers)": [[13, "gymnasium.wrappers.StepAPICompatibility"]], "timelimit (class in gymnasium.wrappers)": [[13, "gymnasium.wrappers.TimeLimit"]], "vectorlistinfo (class in gymnasium.wrappers)": [[13, "gymnasium.wrappers.VectorListInfo"]], "filterobservation (class in gymnasium.wrappers)": [[14, "gymnasium.wrappers.FilterObservation"]], "flattenobservation (class in gymnasium.wrappers)": [[14, "gymnasium.wrappers.FlattenObservation"]], "framestack (class in gymnasium.wrappers)": [[14, "gymnasium.wrappers.FrameStack"]], "grayscaleobservation (class in gymnasium.wrappers)": [[14, "gymnasium.wrappers.GrayScaleObservation"]], "normalizeobservation (class in gymnasium.wrappers)": [[14, "gymnasium.wrappers.NormalizeObservation"]], "observationwrapper (class in gymnasium)": [[14, "gymnasium.ObservationWrapper"]], "pixelobservationwrapper (class in gymnasium.wrappers)": [[14, "gymnasium.wrappers.PixelObservationWrapper"]], "resizeobservation (class in gymnasium.wrappers)": [[14, "gymnasium.wrappers.ResizeObservation"]], "timeawareobservation (class in gymnasium.wrappers)": [[14, "gymnasium.wrappers.TimeAwareObservation"]], "transformobservation (class in gymnasium.wrappers)": [[14, "gymnasium.wrappers.TransformObservation"]], "observation() (in module gymnasium.observationwrapper)": [[14, "gymnasium.ObservationWrapper.observation"]], "normalizereward (class in gymnasium.wrappers)": [[15, "gymnasium.wrappers.NormalizeReward"]], "rewardwrapper (class in gymnasium)": [[15, "gymnasium.RewardWrapper"]], "rewardwrapper.reward() (in module gymnasium.rewardwrapper)": [[15, "gymnasium.RewardWrapper.RewardWrapper.reward"]], "transformreward (class in gymnasium.wrappers)": [[15, "gymnasium.wrappers.TransformReward"]]}})