Files
Gymnasium/searchindex.js
2025-07-02 22:33:00 +00:00

1 line
247 KiB
JavaScript

Search.setIndex({"alltitles": {"0.12.5": [[155, "release-0-12-5"]], "0.19.0": [[155, "release-0-19-0"]], "0.22.0": [[155, "release-0-22-0"]], "0.23.0": [[155, "release-0-23-0"]], "0.23.1": [[155, "release-0-23-1"]], "0.24.0": [[155, "release-0-24-0"]], "0.24.1": [[155, "release-0-24-1"]], "0.25.0": [[155, "release-0-25-0"]], "0.25.1": [[155, "release-0-25-1"]], "0.25.2": [[155, "release-0-25-2"]], "0.26.0": [[155, "release-0-26-0"]], "0.26.1": [[155, "release-0-26-1"]], "0.26.2": [[155, "release-0-26-2"]], "1. Package Name Change": [[160, "package-name-change"]], "2. Seeding and Random Number Generation": [[160, "seeding-and-random-number-generation"]], "3. Environment Reset Changes": [[160, "environment-reset-changes"]], "4. Step Function: The done \u2192 terminated/truncated Split": [[160, "step-function-the-done-terminated-truncated-split"]], "404 - Page Not Found": [[0, null]], "5. Render Mode Changes": [[160, "render-mode-changes"]], "About the Environment: Blackjack": [[163, "about-the-environment-blackjack"]], "Acrobot": [[131, null]], "Action Masking in the Taxi Environment": [[173, null]], "Action Space": [[127, "action-space"], [128, "action-space"], [129, "action-space"], [131, "action-space"], [132, "action-space"], [133, "action-space"], [134, "action-space"], [135, "action-space"], [137, "action-space"], [138, "action-space"], [139, "action-space"], [140, "action-space"], [141, "action-space"], [142, "action-space"], [143, "action-space"], [144, "action-space"], [145, "action-space"], [146, "action-space"], [147, "action-space"], [150, "action-space"], [151, "action-space"], [152, "action-space"], [153, "action-space"], [154, "action-space"]], "Action Space Issues": [[159, "action-space-issues"]], "Action Wrappers": [[16, null]], "Action and observation spaces": [[158, "action-and-observation-spaces"]], "Adding Rendering": [[159, "adding-rendering"]], "Adding a new environment": [[1, "adding-a-new-environment"]], "Additional Methods": [[10, "additional-methods"], [11, "additional-methods"], [12, "additional-methods"]], "Additional functions": [[4, "additional-functions"]], "Advanced Environment Features": [[159, "advanced-environment-features"]], "Advantage Actor-Critic (A2C)": [[178, "advantage-actor-critic-a2c"]], "Adventure": [[22, null]], "AgileRL": [[171, "agilerl"]], "Air Raid": [[23, null]], "Algorithmic heuristics": [[162, "algorithmic-heuristics"]], "Alien": [[24, null]], "Alternative solutions": [[165, "alternative-solutions"]], "Amidar": [[25, null]], "Analyzing Training Results": [[163, "analyzing-training-results"]], "Ant": [[137, null]], "Arguments": [[127, "arguments"], [128, "arguments"], [129, "arguments"], [131, "arguments"], [132, "arguments"], [133, "arguments"], [134, "arguments"], [135, "arguments"], [137, "arguments"], [138, "arguments"], [139, "arguments"], [140, "arguments"], [141, "arguments"], [142, "arguments"], [143, "arguments"], [144, "arguments"], [145, "arguments"], [146, "arguments"], [147, "arguments"], [150, "arguments"], [151, "arguments"], [152, "arguments"], [153, "arguments"], [154, "arguments"]], "Assault": [[26, null]], "Asterix": [[27, null]], "Asteroids": [[28, null]], "AsyncVectorEnv": [[11, null]], "Atari": [[21, null]], "Atlantis": [[29, null]], "Atlantis2": [[30, null]], "Attributes": [[2, "attributes"], [5, "attributes"], [10, "attributes"], [15, "attributes"]], "Autonomous Driving environments": [[148, "autonomous-driving-environments"], [148, "id2"]], "Available Action Wrappers": [[16, "available-action-wrappers"]], "Backgammon": [[31, null]], "Bank Heist": [[32, null]], "Base Class": [[16, "base-class"]], "Basic Math": [[33, null]], "Basic Usage": [[158, null]], "Battle Zone": [[34, null]], "Beam Rider": [[35, null]], "Before You Code: Environment Design": [[159, "before-you-code-environment-design"]], "Berzerk": [[36, null]], "Best Practices Summary": [[161, "best-practices-summary"]], "Biological / Medical environments": [[148, "biological-medical-environments"]], "Bipedal Walker": [[127, null]], "Blackjack": [[37, null], [150, null]], "Boundary Handling Errors": [[159, "boundary-handling-errors"]], "Bowling": [[38, null]], "Box2D": [[126, null]], "Boxing": [[39, null]], "Breakout": [[40, null]], "Build the Documentation": [[1, "build-the-documentation"]], "Building a Q-Learning Agent": [[163, "building-a-q-learning-agent"]], "Building an agent": [[174, "building-an-agent"], [177, "building-an-agent"]], "Car Racing": [[128, null]], "Carnival": [[41, null]], "Cart Pole": [[132, null]], "Casino": [[42, null]], "Centipede": [[43, null]], "Check Environment Validity": [[159, "check-environment-validity"]], "Chopper Command": [[44, null]], "Classic Control": [[130, null]], "Cliff Walking": [[151, null]], "Cliff Walking Slippery": [[152, null]], "Close": [[165, "close"]], "Common Debug Issues": [[159, "common-debug-issues"]], "Common Environment Design Pitfalls": [[159, "common-environment-design-pitfalls"]], "Common Issues for Beginners": [[158, "common-issues-for-beginners"]], "Common Training Issues and Solutions": [[163, "common-training-issues-and-solutions"]], "Common Wrappers": [[17, "common-wrappers"]], "Comparing training performance across versions": [[136, "comparing-training-performance-across-versions"]], "Compatibility Helpers": [[160, "compatibility-helpers"]], "Composite Spaces": [[5, "composite-spaces"], [6, null]], "Constructing Observations": [[159, "constructing-observations"]], "Constructing Observations From Environment States": [[165, "constructing-observations-from-environment-states"]], "Converting Jax-based Functional environments to standard Env": [[3, "converting-jax-based-functional-environments-to-standard-env"]], "Core variables": [[4, "core-variables"]], "Crazy Climber": [[45, null]], "Create a Custom Environment": [[159, null]], "Creating Environment Instances": [[165, "creating-environment-instances"]], "Creating a Package": [[165, "creating-a-package"]], "Creating environments": [[2, "creating-environments"]], "Creating the Q-table": [[175, "creating-the-q-table"]], "Credits": [[127, "credits"], [128, "credits"], [129, "credits"]], "Crossbow": [[46, null]], "Darkchambers": [[47, null]], "Data Conversion Wrappers": [[17, "data-conversion-wrappers"]], "Debugging Your Environment": [[159, "debugging-your-environment"]], "Declaration and Initialization": [[165, "declaration-and-initialization"]], "Defender": [[48, null]], "Demon Attack": [[49, null]], "Description": [[127, "description"], [128, "description"], [129, "description"], [131, "description"], [132, "description"], [133, "description"], [134, "description"], [135, "description"], [137, "description"], [138, "description"], [139, "description"], [140, "description"], [141, "description"], [142, "description"], [143, "description"], [144, "description"], [145, "description"], [146, "description"], [147, "description"], [150, "description"], [151, "description"], [152, "description"], [153, "description"], [154, "description"]], "Design for Learning": [[159, "design-for-learning"]], "Domain Randomization": [[178, "domain-randomization"]], "Donkey Kong": [[50, null]], "Double Dunk": [[51, null]], "Earthworld": [[52, null]], "Economic / Financial environments": [[148, "economic-financial-environments"]], "Editing an environment page": [[1, "editing-an-environment-page"]], "Electrical / Energy environments": [[148, "electrical-energy-environments"]], "Elevator Action": [[53, null]], "Enduro": [[54, null]], "Entombed": [[55, null]], "Env": [[2, null]], "Environment Checking": [[9, "environment-checking"]], "Environment __init__": [[159, "environment-init"]], "Environment pickling": [[9, "environment-pickling"]], "Environment-Specific Changes": [[160, "environment-specific-changes"]], "Epilogue": [[169, "epilogue"]], "Episode End": [[131, "episode-end"], [132, "episode-end"], [133, "episode-end"], [134, "episode-end"], [137, "episode-end"], [138, "episode-end"], [139, "episode-end"], [140, "episode-end"], [141, "episode-end"], [142, "episode-end"], [143, "episode-end"], [144, "episode-end"], [145, "episode-end"], [146, "episode-end"], [147, "episode-end"], [150, "episode-end"], [151, "episode-end"], [152, "episode-end"], [153, "episode-end"], [154, "episode-end"]], "Episode Termination": [[127, "episode-termination"], [128, "episode-termination"], [129, "episode-termination"]], "Episode Truncation": [[135, "episode-truncation"]], "Et": [[56, null]], "Exact reproducibility": [[136, "exact-reproducibility"]], "Executing an action": [[163, "executing-an-action"], [174, "executing-an-action"]], "Explaining the Code Step by Step": [[158, "explaining-the-code-step-by-step"]], "Exploration vs Exploitation": [[163, "exploration-vs-exploitation"]], "External Environments": [[148, null]], "First-Party Environments": [[148, "first-party-environments"]], "Fishing Derby": [[57, null]], "Flag Capture": [[58, null]], "Freeway": [[59, null]], "Frogger": [[60, null]], "Frostbite": [[61, null]], "Frozen Lake": [[153, null]], "Functional Env": [[3, null]], "Fundamental Spaces": [[5, "fundamental-spaces"], [7, null]], "Galaxian": [[62, null]], "Game environments": [[148, "game-environments"]], "Generate your environment": [[165, "generate-your-environment"]], "Getting Help": [[160, "getting-help"]], "Gopher": [[63, null]], "Gravitar": [[64, null]], "GridWorld Example Design": [[159, "gridworld-example-design"]], "Gym Migration Guide": [[160, null]], "Gym Release Notes": [[155, null]], "Gymnasium Basics": [[164, null], [168, null], [170, "gymnasium-basics"]], "Gymnasium Release Notes": [[156, null]], "Gymnasium v1.1.1": [[156, "release-v1-1-1"]], "Gymnasium-docs": [[1, null]], "Gymnasium.vector.VectorEnv": [[10, "gymnasium-vector-vectorenv"]], "Half Cheetah": [[138, null]], "Handling Time Limits": [[166, null]], "Hangman": [[65, null]], "Haunted House": [[66, null]], "Hero": [[67, null]], "Hopper": [[139, null]], "How Action Masking Works": [[173, "how-action-masking-works"]], "Human Cannonball": [[68, null]], "Humanoid": [[140, null]], "Humanoid Standup": [[141, null]], "Ice Hockey": [[69, null]], "Implemented Action wrappers": [[14, "implemented-action-wrappers"]], "Implemented Data Conversion wrappers": [[14, "implemented-data-conversion-wrappers"]], "Implemented Observation wrappers": [[14, "implemented-observation-wrappers"]], "Implemented Reward wrappers": [[14, "implemented-reward-wrappers"]], "Implemented Wrappers": [[18, "implemented-wrappers"], [19, "implemented-wrappers"]], "Implementing Custom Wrappers": [[167, null]], "Implementing environments": [[2, "implementing-environments"]], "Importance in learning code": [[166, "importance-in-learning-code"]], "Imports and Environment Setup": [[174, "imports-and-environment-setup"]], "Information": [[150, "information"], [151, "information"], [152, "information"], [153, "information"], [154, "information"]], "Inheriting from gymnasium.ActionWrapper": [[167, "inheriting-from-gymnasium-actionwrapper"]], "Inheriting from gymnasium.ObservationWrapper": [[167, "inheriting-from-gymnasium-observationwrapper"]], "Inheriting from gymnasium.RewardWrapper": [[167, "inheriting-from-gymnasium-rewardwrapper"]], "Inheriting from gymnasium.Wrapper": [[167, "inheriting-from-gymnasium-wrapper"]], "Initializing Environments": [[158, "initializing-environments"]], "Instructions for modifying environment pages": [[1, "instructions-for-modifying-environment-pages"]], "Integration with Experiment Tracking": [[161, "integration-with-experiment-tracking"]], "Interpreting the Results": [[163, "interpreting-the-results"]], "Introduction": [[178, "introduction"]], "Inverted Double Pendulum": [[142, null]], "Inverted Pendulum": [[143, null]], "Jamesbond": [[70, null]], "Johnny Code from Youtube": [[171, "johnny-code-from-youtube"]], "Journey Escape": [[71, null]], "Kaboom": [[72, null]], "Kangaroo": [[73, null]], "Key Changes Breakdown": [[160, "key-changes-breakdown"]], "Key Design Questions": [[159, "key-design-questions"]], "Keystone Kapers": [[74, null]], "King Kong": [[75, null]], "Klax": [[76, null]], "Koolaid": [[77, null]], "Krull": [[78, null]], "Kung Fu Master": [[79, null]], "Laser Gates": [[80, null]], "List of Wrappers": [[20, null]], "Load custom quadruped robot environments": [[169, null]], "Loading OpenAI Gym environments": [[160, "loading-openai-gym-environments"]], "Lost Luggage": [[81, null]], "Lunar Lander": [[129, null]], "Make and register": [[4, null]], "Make your own custom environment": [[165, null]], "Making Vector Environments": [[10, "making-vector-environments"]], "Manual Testing with Known Actions": [[159, "manual-testing-with-known-actions"]], "Map size: 11 \\times 11": [[175, "map-size-11-times-11"]], "Map size: 4 \\times 4": [[175, "map-size-4-times-4"]], "Map size: 7 \\times 7": [[175, "map-size-7-times-7"]], "Map size: 9 \\times 9": [[175, "map-size-9-times-9"]], "Mario Bros": [[82, null]], "Mathematics / Computational": [[148, "mathematics-computational"]], "Methods": [[2, "methods"], [5, "methods"], [10, "methods"], [15, "methods"]], "Miniature Golf": [[83, null]], "Misc Wrappers": [[17, null]], "Miscellaneous": [[13, "miscellaneous"]], "Modifying the environment": [[158, "modifying-the-environment"]], "Montezuma Revenge": [[84, null]], "More Information": [[161, "more-information"]], "Mountain Car": [[133, null]], "Mountain Car Continuous": [[134, null]], "Mr Do": [[85, null]], "Ms Pacman": [[86, null]], "MuJoCo": [[136, null]], "Name This Game": [[87, null]], "New v0.26+ Code (Including v1.0.0)": [[160, "new-v0-26-code-including-v1-0-0"]], "Next Steps": [[158, "next-steps"], [159, "next-steps"], [163, "next-steps"]], "Notes": [[129, "notes"], [146, "notes"]], "Notice": [[178, "notice"]], "Observation Space": [[127, "observation-space"], [128, "observation-space"], [129, "observation-space"], [131, "observation-space"], [132, "observation-space"], [133, "observation-space"], [134, "observation-space"], [135, "observation-space"], [137, "observation-space"], [138, "observation-space"], [139, "observation-space"], [140, "observation-space"], [141, "observation-space"], [142, "observation-space"], [143, "observation-space"], [144, "observation-space"], [145, "observation-space"], [146, "observation-space"], [147, "observation-space"], [150, "observation-space"], [151, "observation-space"], [152, "observation-space"], [153, "observation-space"], [154, "observation-space"]], "Observation Wrappers": [[18, null]], "Observing the environment": [[174, "observing-the-environment"]], "Old to New Step API Compatibility": [[9, "old-to-new-step-api-compatibility"]], "Old v0.21 Code": [[160, "old-v0-21-code"]], "Optimizing training": [[162, "optimizing-training"]], "Othello": [[88, null]], "Other": [[148, "other"]], "Other environments": [[148, "other-environments"]], "Other steps": [[1, "other-steps"]], "Pacman": [[89, null]], "Parameterized Environments": [[159, "parameterized-environments"]], "Parameters we\u2019ll use": [[175, "parameters-we-ll-use"]], "Pendulum": [[135, null]], "Performance Analysis of Synchronous and Asynchronous Vectorized Environments": [[178, "performance-analysis-of-synchronous-and-asynchronous-vectorized-environments"]], "Phoenix": [[90, null]], "Pitfall": [[91, null]], "Pitfall2": [[92, null]], "Plot learning curve": [[177, "plot-learning-curve"]], "Plotting": [[178, "plotting"]], "Policy Network": [[177, "policy-network"]], "Pong": [[93, null]], "Pooyan": [[94, null]], "Private Eye": [[95, null]], "Pusher": [[144, null]], "Qbert": [[96, null]], "Quick Reference: Complete Changes Table": [[160, "quick-reference-complete-changes-table"]], "Reacher": [[145, null]], "Real-World Environment Design Tips": [[159, "real-world-environment-design-tips"]], "Recommended solution": [[165, "recommended-solution"]], "Recording Agents": [[161, null]], "Recording During Training (Periodic)": [[161, "recording-during-training-periodic"]], "Recording Every Episode (Evaluation)": [[161, "recording-every-episode-evaluation"]], "References": [[128, "references"], [131, "references"], [150, "references"], [151, "references"], [152, "references"], [154, "references"], [175, "references"], [177, "references"], [178, "references"]], "Registering Envs": [[165, "registering-envs"]], "Registering and making the environment": [[159, "registering-and-making-the-environment"]], "Removed Environments": [[160, "removed-environments"]], "Rendering": [[165, "rendering"]], "Rendering Arguments": [[136, "rendering-arguments"]], "Rendering Backend": [[136, "rendering-backend"]], "Reset": [[165, "reset"]], "Reset Arguments": [[128, "reset-arguments"]], "Reset function": [[159, "reset-function"]], "Results Analysis": [[173, "results-analysis"]], "Reward": [[134, "reward"], [151, "reward"], [152, "reward"]], "Reward Design Issues": [[159, "reward-design-issues"]], "Reward Wrappers": [[19, null]], "Reward:": [[133, "reward"]], "Rewards": [[127, "rewards"], [128, "rewards"], [129, "rewards"], [131, "rewards"], [132, "rewards"], [135, "rewards"], [137, "rewards"], [138, "rewards"], [139, "rewards"], [140, "rewards"], [141, "rewards"], [142, "rewards"], [143, "rewards"], [144, "rewards"], [145, "rewards"], [146, "rewards"], [147, "rewards"], [150, "rewards"], [153, "rewards"], [154, "rewards"]], "Riverraid": [[97, null]], "Road Runner": [[98, null]], "Robotank": [[99, null]], "Robotics environments": [[148, "robotics-environments"], [148, "id1"]], "Running the Experiment": [[173, "running-the-experiment"]], "Running the environment": [[175, "running-the-environment"]], "Runtime Performance benchmark": [[9, "runtime-performance-benchmark"]], "Save Rendering Videos": [[9, "save-rendering-videos"]], "Saving/ Loading Weights": [[178, "saving-loading-weights"]], "Seaquest": [[100, null]], "Seeding": [[9, "seeding"]], "Setup": [[165, "setup"], [169, "setup"], [178, "setup"]], "Shared Memory for a Space": [[13, "shared-memory-for-a-space"]], "Showcase the Agent": [[178, "showcase-the-agent"]], "Side-by-Side Code Comparison": [[160, "side-by-side-code-comparison"]], "Sir Lancelot": [[101, null]], "Skiing": [[102, null]], "Solaris": [[103, null]], "Solution": [[166, "solution"]], "Solving Blackjack with Tabular Q-Learning": [[174, null]], "Solving Frozenlake with Tabular Q-Learning": [[175, null]], "Space Invaders": [[104, null]], "Space War": [[105, null]], "Spaces": [[5, null]], "Spaces Utils": [[8, null]], "Speeding Up Training": [[162, null]], "Speeding up A2C Training with Vector Envs": [[178, null]], "Star Gunner": [[106, null]], "Start Simple, Add Complexity Gradually": [[159, "start-simple-add-complexity-gradually"]], "Starting State": [[127, "starting-state"], [128, "starting-state"], [129, "starting-state"], [131, "starting-state"], [132, "starting-state"], [133, "starting-state"], [134, "starting-state"], [135, "starting-state"], [137, "starting-state"], [138, "starting-state"], [139, "starting-state"], [140, "starting-state"], [141, "starting-state"], [142, "starting-state"], [143, "starting-state"], [144, "starting-state"], [145, "starting-state"], [146, "starting-state"], [147, "starting-state"], [150, "starting-state"], [151, "starting-state"], [152, "starting-state"], [153, "starting-state"], [154, "starting-state"]], "State Representation Problems": [[159, "state-representation-problems"]], "Step": [[165, "step"]], "Step 0.1 - Download a Robot Model": [[169, "step-0-1-download-a-robot-model"]], "Step 1 - Load the model": [[169, "step-1-load-the-model"]], "Step 2 - Tweaking the Environment Parameters": [[169, "step-2-tweaking-the-environment-parameters"]], "Step 2.1 - Tweaking the Environment Simulation Parameters": [[169, "step-2-1-tweaking-the-environment-simulation-parameters"]], "Step 2.2 - Tweaking the Environment Termination Parameters": [[169, "step-2-2-tweaking-the-environment-termination-parameters"]], "Step 2.3 - Tweaking the Environment Reward Parameters": [[169, "step-2-3-tweaking-the-environment-reward-parameters"]], "Step 2.4 - Tweaking the Environment Observation Parameters": [[169, "step-2-4-tweaking-the-environment-observation-parameters"]], "Step 3 - Train your Agent": [[169, "step-3-train-your-agent"]], "Step API Compatibility": [[160, "step-api-compatibility"]], "Step function": [[159, "step-function"]], "Subclassing gymnasium.Env": [[165, "subclassing-gymnasium-env"]], "Superman": [[107, null]], "Surround": [[108, null]], "Swimmer": [[146, null]], "SyncVectorEnv": [[12, null]], "Taxi": [[154, null]], "Telecommunication Systems environments": [[148, "telecommunication-systems-environments"]], "Tennis": [[109, null]], "Termination": [[137, "termination"], [138, "termination"], [139, "termination"], [140, "termination"], [141, "termination"], [142, "termination"], [143, "termination"], [144, "termination"], [145, "termination"], [146, "termination"], [147, "termination"], [166, "termination"]], "Testing Your Migration": [[160, "testing-your-migration"]], "Testing Your Trained Agent": [[163, "testing-your-trained-agent"]], "Tetris": [[110, null]], "The FrozenLake environment": [[175, "the-frozenlake-environment"]], "The Learning Process": [[163, "the-learning-process"]], "The Training Loop": [[163, "the-training-loop"]], "The requested page could not be found.": [[0, "the-requested-page-could-not-be-found"]], "Think About Your Research Question": [[159, "think-about-your-research-question"]], "Think you can do better?": [[174, "think-you-can-do-better"]], "Third-Party Environments using Gym": [[148, "third-party-environments-using-gym"]], "Third-Party Tutorials": [[171, null]], "Third-Party tutorials about gymnasium": [[171, "third-party-tutorials-about-gymnasium"]], "Third-Party tutorials about libraries that use gymnasium": [[171, "third-party-tutorials-about-libraries-that-use-gymnasium"]], "Third-party environments with Gymnasium": [[148, "third-party-environments-with-gymnasium"]], "Tic Tac Toe 3D": [[111, null]], "Time Pilot": [[112, null]], "TimeLimit Wrapper Changes": [[160, "timelimit-wrapper-changes"]], "Toy Text": [[149, null]], "Training Agents": [[170, "training-agents"], [172, null], [176, null]], "Training Recording Benefits": [[161, "training-recording-benefits"]], "Training an Agent": [[163, null]], "Training the A2C Agent": [[178, "training-the-a2c-agent"]], "Training the Agent": [[163, "training-the-agent"]], "Training using REINFORCE for Mujoco": [[177, null]], "Transition Dynamics:": [[133, "transition-dynamics"], [134, "transition-dynamics"]], "Trondead": [[113, null]], "Truncation": [[137, "truncation"], [138, "truncation"], [139, "truncation"], [140, "truncation"], [141, "truncation"], [142, "truncation"], [143, "truncation"], [144, "truncation"], [145, "truncation"], [146, "truncation"], [147, "truncation"], [166, "truncation"]], "Try playing the environment yourself": [[178, "try-playing-the-environment-yourself"]], "Turmoil": [[114, null]], "Tutankham": [[115, null]], "Tutorials": [[170, null]], "Uncommon Wrappers": [[17, "uncommon-wrappers"]], "Understanding Q-Learning Intuitively": [[163, "understanding-q-learning-intuitively"]], "Understanding the Agent-Environment Loop": [[158, "understanding-the-agent-environment-loop"]], "Understanding the Output": [[161, "understanding-the-output"]], "Understanding the Q-Learning Update": [[163, "understanding-the-q-learning-update"]], "Understanding the Taxi Environment": [[173, "understanding-the-taxi-environment"]], "Up N Down": [[116, null]], "Using Vectorized Environments": [[178, "using-vectorized-environments"]], "Using Wrappers": [[159, "using-wrappers"], [165, "using-wrappers"]], "Utility functions": [[5, "utility-functions"], [9, null], [13, null]], "Vector Only wrappers": [[14, "vector-only-wrappers"]], "Vector Utility functions": [[5, "vector-utility-functions"]], "Vector only Wrappers": [[20, "vector-only-wrappers"]], "Vectorize": [[10, null]], "Vectorized Common wrappers": [[14, "vectorized-common-wrappers"]], "Vectorized environment": [[132, "vectorized-environment"]], "Vectorized environments": [[162, "vectorized-environments"]], "Vectorizing Spaces": [[13, "vectorizing-spaces"]], "Venture": [[117, null]], "Version History": [[127, "version-history"], [128, "version-history"], [129, "version-history"], [131, "version-history"], [132, "version-history"], [133, "version-history"], [134, "version-history"], [135, "version-history"], [137, "version-history"], [138, "version-history"], [139, "version-history"], [140, "version-history"], [141, "version-history"], [142, "version-history"], [143, "version-history"], [144, "version-history"], [145, "version-history"], [146, "version-history"], [147, "version-history"], [150, "version-history"], [151, "version-history"], [152, "version-history"], [153, "version-history"], [154, "version-history"]], "Versions": [[136, "versions"]], "Video Checkers": [[118, null]], "Video Chess": [[119, null]], "Video Cube": [[120, null]], "Video Game environments": [[148, "video-game-environments"]], "Video Pinball": [[121, null]], "Visualising the policy": [[174, "visualising-the-policy"]], "Visualization": [[9, "visualization"], [175, "visualization"]], "Visualizing Results": [[173, "visualizing-results"]], "Visualizing the training": [[174, "visualizing-the-training"]], "Walker2D": [[147, null]], "What is Reinforcement Learning?": [[158, "what-is-reinforcement-learning"]], "What to Expect During Training": [[163, "what-to-expect-during-training"]], "When to Record": [[161, "when-to-record"]], "Who Should Read This Guide?": [[160, "who-should-read-this-guide"]], "Why Did the API Change?": [[160, "why-did-the-api-change"]], "Why Gymnasium?": [[158, "why-gymnasium"]], "Why Record Your Agent?": [[161, "why-record-your-agent"]], "Wizard Of Wor": [[122, null]], "Word Zapper": [[123, null]], "Wrappers": [[14, null], [15, null]], "Writing Tutorials": [[1, "writing-tutorials"]], "Yars Revenge": [[124, null]], "Your First RL Program": [[158, "your-first-rl-program"]], "Zaxxon": [[125, null]], "freeCodeCamp from Youtube": [[171, "freecodecamp-from-youtube"]], "v0.20.0": [[155, "release-v0-20-0"]], "v0.21.0": [[155, "release-v0-21-0"]], "v0.26.0: Initial Release": [[156, "release-v0-26-0"]], "v0.26.1": [[156, "release-v0-26-1"]], "v0.26.2 ": [[156, "release-v0-26-2"]], "v0.26.3": [[156, "release-v0-26-3"]], "v0.27.0": [[156, "release-v0-27-0"]], "v0.27.1": [[156, "release-v0-27-1"]], "v0.28.0": [[156, "release-v0-28-0"]], "v0.28.1": [[156, "release-v0-28-1"]], "v0.29.0": [[156, "release-v0-29-0"]], "v0.29.1 ": [[156, "release-v0-29-1"]], "v0.7.3": [[155, "release-v0-7-3"]], "v0.7.4": [[155, "release-v0-7-4"]], "v0.9.5": [[155, "release-v0-9-5"]], "v0.9.6": [[155, "release-v0-9-6"]], "v1.0.0": [[156, "release-v1-0-0"]], "v1.0.0a1: v1.0.0 alpha1 ": [[156, "release-v1-0-0a1"]], "v1.0.0a2: v1.0.0 alpha 2": [[156, "release-v1-0-0a2"]], "v1.1.0": [[156, "release-v1-1-0"]], "v1.2.0": [[156, "release-v1-2-0"]], "\ud83d\udea8 Agent Gets Stuck in Poor Strategy": [[163, "agent-gets-stuck-in-poor-strategy"]], "\ud83d\udea8 Agent Never Improves": [[163, "agent-never-improves"]], "\ud83d\udea8 Learning Too Slow": [[163, "learning-too-slow"]], "\ud83d\udea8 Unstable Training": [[163, "unstable-training"]]}, "docnames": ["404", "README", "api/env", "api/functional", "api/registry", "api/spaces", "api/spaces/composite", "api/spaces/fundamental", "api/spaces/utils", "api/utils", "api/vector", "api/vector/async_vector_env", "api/vector/sync_vector_env", "api/vector/utils", "api/vector/wrappers", "api/wrappers", "api/wrappers/action_wrappers", "api/wrappers/misc_wrappers", "api/wrappers/observation_wrappers", "api/wrappers/reward_wrappers", "api/wrappers/table", "environments/atari", "environments/atari/adventure", "environments/atari/air_raid", "environments/atari/alien", "environments/atari/amidar", "environments/atari/assault", "environments/atari/asterix", "environments/atari/asteroids", "environments/atari/atlantis", "environments/atari/atlantis2", "environments/atari/backgammon", "environments/atari/bank_heist", "environments/atari/basic_math", "environments/atari/battle_zone", "environments/atari/beam_rider", "environments/atari/berzerk", "environments/atari/blackjack", "environments/atari/bowling", "environments/atari/boxing", "environments/atari/breakout", "environments/atari/carnival", "environments/atari/casino", "environments/atari/centipede", "environments/atari/chopper_command", "environments/atari/crazy_climber", "environments/atari/crossbow", "environments/atari/darkchambers", "environments/atari/defender", "environments/atari/demon_attack", "environments/atari/donkey_kong", "environments/atari/double_dunk", "environments/atari/earthworld", "environments/atari/elevator_action", "environments/atari/enduro", "environments/atari/entombed", "environments/atari/et", "environments/atari/fishing_derby", "environments/atari/flag_capture", "environments/atari/freeway", "environments/atari/frogger", "environments/atari/frostbite", "environments/atari/galaxian", "environments/atari/gopher", "environments/atari/gravitar", "environments/atari/hangman", "environments/atari/haunted_house", "environments/atari/hero", "environments/atari/human_cannonball", "environments/atari/ice_hockey", "environments/atari/jamesbond", "environments/atari/journey_escape", "environments/atari/kaboom", "environments/atari/kangaroo", "environments/atari/keystone_kapers", "environments/atari/king_kong", "environments/atari/klax", "environments/atari/koolaid", "environments/atari/krull", "environments/atari/kung_fu_master", "environments/atari/laser_gates", "environments/atari/lost_luggage", "environments/atari/mario_bros", "environments/atari/miniature_golf", "environments/atari/montezuma_revenge", "environments/atari/mr_do", "environments/atari/ms_pacman", "environments/atari/name_this_game", "environments/atari/othello", "environments/atari/pacman", "environments/atari/phoenix", "environments/atari/pitfall", "environments/atari/pitfall2", "environments/atari/pong", "environments/atari/pooyan", "environments/atari/private_eye", "environments/atari/qbert", "environments/atari/riverraid", "environments/atari/road_runner", "environments/atari/robotank", "environments/atari/seaquest", "environments/atari/sir_lancelot", "environments/atari/skiing", "environments/atari/solaris", "environments/atari/space_invaders", "environments/atari/space_war", "environments/atari/star_gunner", "environments/atari/superman", "environments/atari/surround", "environments/atari/tennis", "environments/atari/tetris", "environments/atari/tic_tac_toe_3d", "environments/atari/time_pilot", "environments/atari/trondead", "environments/atari/turmoil", "environments/atari/tutankham", "environments/atari/up_n_down", "environments/atari/venture", "environments/atari/video_checkers", "environments/atari/video_chess", "environments/atari/video_cube", "environments/atari/video_pinball", "environments/atari/wizard_of_wor", "environments/atari/word_zapper", "environments/atari/yars_revenge", "environments/atari/zaxxon", "environments/box2d", "environments/box2d/bipedal_walker", "environments/box2d/car_racing", "environments/box2d/lunar_lander", "environments/classic_control", "environments/classic_control/acrobot", "environments/classic_control/cart_pole", "environments/classic_control/mountain_car", "environments/classic_control/mountain_car_continuous", "environments/classic_control/pendulum", "environments/mujoco", "environments/mujoco/ant", "environments/mujoco/half_cheetah", "environments/mujoco/hopper", "environments/mujoco/humanoid", "environments/mujoco/humanoid_standup", "environments/mujoco/inverted_double_pendulum", "environments/mujoco/inverted_pendulum", "environments/mujoco/pusher", "environments/mujoco/reacher", "environments/mujoco/swimmer", "environments/mujoco/walker2d", "environments/third_party_environments", "environments/toy_text", "environments/toy_text/blackjack", "environments/toy_text/cliff_walking", "environments/toy_text/cliff_walking_slippery", "environments/toy_text/frozen_lake", "environments/toy_text/taxi", "gym_release_notes/index", "gymnasium_release_notes/index", "index", "introduction/basic_usage", "introduction/create_custom_env", "introduction/migration_guide", "introduction/record_agent", "introduction/speed_up_env", "introduction/train_agent", "tutorials/gymnasium_basics/README", "tutorials/gymnasium_basics/environment_creation", "tutorials/gymnasium_basics/handling_time_limits", "tutorials/gymnasium_basics/implementing_custom_wrappers", "tutorials/gymnasium_basics/index", "tutorials/gymnasium_basics/load_quadruped_model", "tutorials/index", "tutorials/third-party-tutorials", "tutorials/training_agents/README", "tutorials/training_agents/action_masking_taxi", "tutorials/training_agents/blackjack_q_learning", "tutorials/training_agents/frozenlake_q_learning", "tutorials/training_agents/index", "tutorials/training_agents/mujoco_reinforce", "tutorials/training_agents/vector_a2c"], "envversion": {"sphinx": 62, "sphinx.domains.c": 3, "sphinx.domains.changeset": 1, "sphinx.domains.citation": 1, "sphinx.domains.cpp": 9, "sphinx.domains.index": 1, "sphinx.domains.javascript": 3, "sphinx.domains.math": 2, "sphinx.domains.python": 4, "sphinx.domains.rst": 2, "sphinx.domains.std": 2, "sphinx.ext.viewcode": 1}, "filenames": ["404.md", "README.md", "api/env.md", "api/functional.md", "api/registry.md", "api/spaces.md", "api/spaces/composite.md", "api/spaces/fundamental.md", "api/spaces/utils.md", "api/utils.md", "api/vector.md", "api/vector/async_vector_env.md", "api/vector/sync_vector_env.md", "api/vector/utils.md", "api/vector/wrappers.md", "api/wrappers.md", "api/wrappers/action_wrappers.md", "api/wrappers/misc_wrappers.md", "api/wrappers/observation_wrappers.md", "api/wrappers/reward_wrappers.md", "api/wrappers/table.md", "environments/atari.md", "environments/atari/adventure.md", "environments/atari/air_raid.md", "environments/atari/alien.md", "environments/atari/amidar.md", "environments/atari/assault.md", "environments/atari/asterix.md", "environments/atari/asteroids.md", "environments/atari/atlantis.md", "environments/atari/atlantis2.md", "environments/atari/backgammon.md", "environments/atari/bank_heist.md", "environments/atari/basic_math.md", "environments/atari/battle_zone.md", "environments/atari/beam_rider.md", "environments/atari/berzerk.md", "environments/atari/blackjack.md", "environments/atari/bowling.md", "environments/atari/boxing.md", "environments/atari/breakout.md", "environments/atari/carnival.md", "environments/atari/casino.md", "environments/atari/centipede.md", "environments/atari/chopper_command.md", "environments/atari/crazy_climber.md", "environments/atari/crossbow.md", "environments/atari/darkchambers.md", "environments/atari/defender.md", "environments/atari/demon_attack.md", "environments/atari/donkey_kong.md", "environments/atari/double_dunk.md", "environments/atari/earthworld.md", "environments/atari/elevator_action.md", "environments/atari/enduro.md", "environments/atari/entombed.md", "environments/atari/et.md", "environments/atari/fishing_derby.md", "environments/atari/flag_capture.md", "environments/atari/freeway.md", "environments/atari/frogger.md", "environments/atari/frostbite.md", "environments/atari/galaxian.md", "environments/atari/gopher.md", "environments/atari/gravitar.md", "environments/atari/hangman.md", "environments/atari/haunted_house.md", "environments/atari/hero.md", "environments/atari/human_cannonball.md", "environments/atari/ice_hockey.md", "environments/atari/jamesbond.md", "environments/atari/journey_escape.md", "environments/atari/kaboom.md", "environments/atari/kangaroo.md", "environments/atari/keystone_kapers.md", "environments/atari/king_kong.md", "environments/atari/klax.md", "environments/atari/koolaid.md", "environments/atari/krull.md", "environments/atari/kung_fu_master.md", "environments/atari/laser_gates.md", "environments/atari/lost_luggage.md", "environments/atari/mario_bros.md", "environments/atari/miniature_golf.md", "environments/atari/montezuma_revenge.md", "environments/atari/mr_do.md", "environments/atari/ms_pacman.md", "environments/atari/name_this_game.md", "environments/atari/othello.md", "environments/atari/pacman.md", "environments/atari/phoenix.md", "environments/atari/pitfall.md", "environments/atari/pitfall2.md", "environments/atari/pong.md", "environments/atari/pooyan.md", "environments/atari/private_eye.md", "environments/atari/qbert.md", "environments/atari/riverraid.md", "environments/atari/road_runner.md", "environments/atari/robotank.md", "environments/atari/seaquest.md", "environments/atari/sir_lancelot.md", "environments/atari/skiing.md", "environments/atari/solaris.md", "environments/atari/space_invaders.md", "environments/atari/space_war.md", "environments/atari/star_gunner.md", "environments/atari/superman.md", "environments/atari/surround.md", "environments/atari/tennis.md", "environments/atari/tetris.md", "environments/atari/tic_tac_toe_3d.md", "environments/atari/time_pilot.md", "environments/atari/trondead.md", "environments/atari/turmoil.md", "environments/atari/tutankham.md", "environments/atari/up_n_down.md", "environments/atari/venture.md", "environments/atari/video_checkers.md", "environments/atari/video_chess.md", "environments/atari/video_cube.md", "environments/atari/video_pinball.md", "environments/atari/wizard_of_wor.md", "environments/atari/word_zapper.md", "environments/atari/yars_revenge.md", "environments/atari/zaxxon.md", "environments/box2d.md", "environments/box2d/bipedal_walker.md", "environments/box2d/car_racing.md", "environments/box2d/lunar_lander.md", "environments/classic_control.md", "environments/classic_control/acrobot.md", "environments/classic_control/cart_pole.md", "environments/classic_control/mountain_car.md", "environments/classic_control/mountain_car_continuous.md", "environments/classic_control/pendulum.md", "environments/mujoco.md", "environments/mujoco/ant.md", "environments/mujoco/half_cheetah.md", "environments/mujoco/hopper.md", "environments/mujoco/humanoid.md", "environments/mujoco/humanoid_standup.md", "environments/mujoco/inverted_double_pendulum.md", "environments/mujoco/inverted_pendulum.md", "environments/mujoco/pusher.md", "environments/mujoco/reacher.md", "environments/mujoco/swimmer.md", "environments/mujoco/walker2d.md", "environments/third_party_environments.md", "environments/toy_text.md", "environments/toy_text/blackjack.md", "environments/toy_text/cliff_walking.md", "environments/toy_text/cliff_walking_slippery.md", "environments/toy_text/frozen_lake.md", "environments/toy_text/taxi.md", "gym_release_notes/index.md", "gymnasium_release_notes/index.md", "index.md", "introduction/basic_usage.md", "introduction/create_custom_env.md", "introduction/migration_guide.md", "introduction/record_agent.md", "introduction/speed_up_env.md", "introduction/train_agent.md", "tutorials/gymnasium_basics/README.rst", "tutorials/gymnasium_basics/environment_creation.rst", "tutorials/gymnasium_basics/handling_time_limits.rst", "tutorials/gymnasium_basics/implementing_custom_wrappers.rst", "tutorials/gymnasium_basics/index.rst", "tutorials/gymnasium_basics/load_quadruped_model.rst", "tutorials/index.rst", "tutorials/third-party-tutorials.md", "tutorials/training_agents/README.rst", "tutorials/training_agents/action_masking_taxi.rst", "tutorials/training_agents/blackjack_q_learning.rst", "tutorials/training_agents/frozenlake_q_learning.rst", "tutorials/training_agents/index.rst", "tutorials/training_agents/mujoco_reinforce.rst", "tutorials/training_agents/vector_a2c.rst"], "indexentries": {"action() (gymnasium.actionwrapper method)": [[16, "gymnasium.ActionWrapper.action", false]], "action_space (gymnasium.env attribute)": [[2, "gymnasium.Env.action_space", false]], "action_space (gymnasium.vector.vectorenv attribute)": [[10, "gymnasium.vector.VectorEnv.action_space", false]], "action_space (gymnasium.wrapper property)": [[15, "gymnasium.Wrapper.action_space", false]], "actions() (gymnasium.vector.vectoractionwrapper method)": [[14, "gymnasium.vector.VectorActionWrapper.actions", false]], "actionwrapper (class in gymnasium)": [[16, "gymnasium.ActionWrapper", false]], "addrenderobservation (class in gymnasium.wrappers)": [[18, "gymnasium.wrappers.AddRenderObservation", false]], "arrayconversion (class in gymnasium.wrappers)": [[17, "gymnasium.wrappers.ArrayConversion", false]], "arrayconversion (class in gymnasium.wrappers.vector)": [[14, "gymnasium.wrappers.vector.ArrayConversion", false]], "asyncvectorenv (class in gymnasium.vector)": [[11, "gymnasium.vector.AsyncVectorEnv", false]], "ataripreprocessing (class in gymnasium.wrappers)": [[17, "gymnasium.wrappers.AtariPreprocessing", false]], "autoreset (class in gymnasium.wrappers)": [[17, "gymnasium.wrappers.Autoreset", false]], "batch_space() (in module gymnasium.vector.utils)": [[13, "gymnasium.vector.utils.batch_space", false]], "benchmark_init() (in module gymnasium.utils.performance)": [[9, "gymnasium.utils.performance.benchmark_init", false]], "benchmark_render() (in module gymnasium.utils.performance)": [[9, "gymnasium.utils.performance.benchmark_render", false]], "benchmark_step() (in module gymnasium.utils.performance)": [[9, "gymnasium.utils.performance.benchmark_step", false]], "box (class in gymnasium.spaces)": [[7, "gymnasium.spaces.Box", false]], "call() (gymnasium.vector.asyncvectorenv method)": [[11, "gymnasium.vector.AsyncVectorEnv.call", false]], "call() (gymnasium.vector.syncvectorenv method)": [[12, "gymnasium.vector.SyncVectorEnv.call", false]], "callback() (gymnasium.utils.play.playplot method)": [[9, "gymnasium.utils.play.PlayPlot.callback", false]], "capped_cubic_video_schedule() (in module gymnasium.utils.save_video)": [[9, "gymnasium.utils.save_video.capped_cubic_video_schedule", false]], "check_env() (in module gymnasium.utils.env_checker)": [[9, "gymnasium.utils.env_checker.check_env", false]], "clear_mpi_env_vars() (in module gymnasium.vector.utils)": [[13, "gymnasium.vector.utils.clear_mpi_env_vars", false]], "clipaction (class in gymnasium.wrappers)": [[16, "gymnasium.wrappers.ClipAction", false]], "clipaction (class in gymnasium.wrappers.vector)": [[14, "gymnasium.wrappers.vector.ClipAction", false]], "clipreward (class in gymnasium.wrappers)": [[19, "gymnasium.wrappers.ClipReward", false]], "clipreward (class in gymnasium.wrappers.vector)": [[14, "gymnasium.wrappers.vector.ClipReward", false]], "close() (gymnasium.env method)": [[2, "gymnasium.Env.close", false]], "close() (gymnasium.vector.asyncvectorenv method)": [[11, "gymnasium.vector.AsyncVectorEnv.close", false]], "close() (gymnasium.vector.syncvectorenv method)": [[12, "gymnasium.vector.SyncVectorEnv.close", false]], "close() (gymnasium.vector.vectorenv method)": [[10, "gymnasium.vector.VectorEnv.close", false]], "close() (gymnasium.vector.vectorwrapper method)": [[14, "gymnasium.vector.VectorWrapper.close", false]], "close() (gymnasium.wrapper method)": [[15, "gymnasium.Wrapper.close", false]], "closed (gymnasium.vector.vectorenv attribute)": [[10, "gymnasium.vector.VectorEnv.closed", false]], "cloudpicklewrapper() (in module gymnasium.vector.utils)": [[13, "gymnasium.vector.utils.CloudpickleWrapper", false]], "concatenate() (in module gymnasium.vector.utils)": [[13, "gymnasium.vector.utils.concatenate", false]], "contains() (gymnasium.spaces.space method)": [[5, "gymnasium.spaces.Space.contains", false]], "convert_to_done_step_api() (in module gymnasium.utils.step_api_compatibility)": [[9, "gymnasium.utils.step_api_compatibility.convert_to_done_step_api", false]], "convert_to_terminated_truncated_step_api() (in module gymnasium.utils.step_api_compatibility)": [[9, "gymnasium.utils.step_api_compatibility.convert_to_terminated_truncated_step_api", false]], "create_empty_array() (in module gymnasium.vector.utils)": [[13, "gymnasium.vector.utils.create_empty_array", false]], "create_shared_memory() (in module gymnasium.vector.utils)": [[13, "gymnasium.vector.utils.create_shared_memory", false]], "current_namespace (gymnasium.envs.registration attribute)": [[4, "gymnasium.envs.registration.current_namespace", false]], "delayobservation (class in gymnasium.wrappers)": [[18, "gymnasium.wrappers.DelayObservation", false]], "dict (class in gymnasium.spaces)": [[6, "gymnasium.spaces.Dict", false]], "dictinfotolist (class in gymnasium.wrappers.vector)": [[14, "gymnasium.wrappers.vector.DictInfoToList", false]], "discrete (class in gymnasium.spaces)": [[7, "gymnasium.spaces.Discrete", false]], "dtype (gymnasium.spaces.space property)": [[5, "gymnasium.spaces.Space.dtype", false]], "dtypeobservation (class in gymnasium.wrappers)": [[18, "gymnasium.wrappers.DtypeObservation", false]], "dtypeobservation (class in gymnasium.wrappers.vector)": [[14, "gymnasium.wrappers.vector.DtypeObservation", false]], "env (class in gymnasium)": [[2, "gymnasium.Env", false]], "env (gymnasium.wrapper attribute)": [[15, "gymnasium.Wrapper.env", false]], "envspec (class in gymnasium.envs.registration)": [[4, "gymnasium.envs.registration.EnvSpec", false]], "ezpickle (class in gymnasium.utils.ezpickle)": [[9, "gymnasium.utils.ezpickle.EzPickle", false]], "filterobservation (class in gymnasium.wrappers)": [[18, "gymnasium.wrappers.FilterObservation", false]], "filterobservation (class in gymnasium.wrappers.vector)": [[14, "gymnasium.wrappers.vector.FilterObservation", false]], "find_highest_version() (in module gymnasium.envs.registration)": [[4, "gymnasium.envs.registration.find_highest_version", false]], "flatdim() (in module gymnasium.spaces.utils)": [[8, "gymnasium.spaces.utils.flatdim", false]], "flatten() (in module gymnasium.spaces.utils)": [[8, "gymnasium.spaces.utils.flatten", false]], "flatten_space() (in module gymnasium.spaces.utils)": [[8, "gymnasium.spaces.utils.flatten_space", false]], "flattenobservation (class in gymnasium.wrappers)": [[18, "gymnasium.wrappers.FlattenObservation", false]], "flattenobservation (class in gymnasium.wrappers.vector)": [[14, "gymnasium.wrappers.vector.FlattenObservation", false]], "framestackobservation (class in gymnasium.wrappers)": [[18, "gymnasium.wrappers.FrameStackObservation", false]], "from_jsonable() (gymnasium.spaces.space method)": [[5, "gymnasium.spaces.Space.from_jsonable", false]], "funcenv (class in gymnasium.experimental.functional)": [[3, "gymnasium.experimental.functional.FuncEnv", false]], "functionaljaxenv (class in gymnasium.envs.functional_jax_env)": [[3, "gymnasium.envs.functional_jax_env.FunctionalJaxEnv", false]], "get_attr() (gymnasium.vector.asyncvectorenv method)": [[11, "gymnasium.vector.AsyncVectorEnv.get_attr", false]], "get_attr() (gymnasium.vector.syncvectorenv method)": [[12, "gymnasium.vector.SyncVectorEnv.get_attr", false]], "get_env_id() (in module gymnasium.envs.registration)": [[4, "gymnasium.envs.registration.get_env_id", false]], "get_wrapper_attr() (gymnasium.wrapper method)": [[15, "gymnasium.Wrapper.get_wrapper_attr", false]], "graph (class in gymnasium.spaces)": [[6, "gymnasium.spaces.Graph", false]], "grayscaleobservation (class in gymnasium.wrappers)": [[18, "gymnasium.wrappers.GrayscaleObservation", false]], "grayscaleobservation (class in gymnasium.wrappers.vector)": [[14, "gymnasium.wrappers.vector.GrayscaleObservation", false]], "gymnasium.spaces": [[5, "module-gymnasium.spaces", false]], "gymnasium.wrappers": [[15, "module-gymnasium.wrappers", false]], "humanrendering (class in gymnasium.wrappers)": [[17, "gymnasium.wrappers.HumanRendering", false]], "initial() (gymnasium.experimental.functional.funcenv method)": [[3, "gymnasium.experimental.functional.FuncEnv.initial", false]], "is_bounded() (gymnasium.spaces.box method)": [[7, "gymnasium.spaces.Box.is_bounded", false]], "is_np_flattenable (gymnasium.spaces.space property)": [[5, "gymnasium.spaces.Space.is_np_flattenable", false]], "iterate() (in module gymnasium.vector.utils)": [[13, "gymnasium.vector.utils.iterate", false]], "jaxtonumpy (class in gymnasium.wrappers)": [[17, "gymnasium.wrappers.JaxToNumpy", false]], "jaxtonumpy (class in gymnasium.wrappers.vector)": [[14, "gymnasium.wrappers.vector.JaxToNumpy", false]], "jaxtotorch (class in gymnasium.wrappers)": [[17, "gymnasium.wrappers.JaxToTorch", false]], "jaxtotorch (class in gymnasium.wrappers.vector)": [[14, "gymnasium.wrappers.vector.JaxToTorch", false]], "load_env_creator() (in module gymnasium.envs.registration)": [[4, "gymnasium.envs.registration.load_env_creator", false]], "make() (in module gymnasium)": [[4, "gymnasium.make", false]], "make_vec() (in module gymnasium)": [[4, "gymnasium.make_vec", false]], "maxandskipobservation (class in gymnasium.wrappers)": [[18, "gymnasium.wrappers.MaxAndSkipObservation", false]], "metadata (gymnasium.env attribute)": [[2, "gymnasium.Env.metadata", false]], "metadata (gymnasium.vector.vectorenv attribute)": [[10, "gymnasium.vector.VectorEnv.metadata", false]], "metadata (gymnasium.wrapper property)": [[15, "gymnasium.Wrapper.metadata", false]], "module": [[5, "module-gymnasium.spaces", false], [15, "module-gymnasium.wrappers", false]], "multibinary (class in gymnasium.spaces)": [[7, "gymnasium.spaces.MultiBinary", false]], "multidiscrete (class in gymnasium.spaces)": [[7, "gymnasium.spaces.MultiDiscrete", false]], "namespace() (in module gymnasium.envs.registration)": [[4, "gymnasium.envs.registration.namespace", false]], "normalizeobservation (class in gymnasium.wrappers)": [[18, "gymnasium.wrappers.NormalizeObservation", false]], "normalizeobservation (class in gymnasium.wrappers.vector)": [[14, "gymnasium.wrappers.vector.NormalizeObservation", false]], "normalizereward (class in gymnasium.wrappers)": [[19, "gymnasium.wrappers.NormalizeReward", false]], "normalizereward (class in gymnasium.wrappers.vector)": [[14, "gymnasium.wrappers.vector.NormalizeReward", false]], "np_random (gymnasium.env property)": [[2, "gymnasium.Env.np_random", false]], "np_random (gymnasium.spaces.space property)": [[5, "gymnasium.spaces.Space.np_random", false]], "np_random (gymnasium.vector.asyncvectorenv property)": [[11, "gymnasium.vector.AsyncVectorEnv.np_random", false]], "np_random (gymnasium.vector.syncvectorenv property)": [[12, "gymnasium.vector.SyncVectorEnv.np_random", false]], "np_random (gymnasium.vector.vectorenv property)": [[10, "gymnasium.vector.VectorEnv.np_random", false]], "np_random (gymnasium.wrapper property)": [[15, "gymnasium.Wrapper.np_random", false]], "np_random() (in module gymnasium.utils.seeding)": [[9, "gymnasium.utils.seeding.np_random", false]], "np_random_seed (gymnasium.env property)": [[2, "gymnasium.Env.np_random_seed", false]], "np_random_seed (gymnasium.vector.asyncvectorenv property)": [[11, "gymnasium.vector.AsyncVectorEnv.np_random_seed", false]], "np_random_seed (gymnasium.vector.syncvectorenv property)": [[12, "gymnasium.vector.SyncVectorEnv.np_random_seed", false]], "np_random_seed (gymnasium.vector.vectorenv property)": [[10, "gymnasium.vector.VectorEnv.np_random_seed", false]], "np_random_seed (gymnasium.wrapper property)": [[15, "gymnasium.Wrapper.np_random_seed", false]], "num_envs (gymnasium.vector.vectorenv attribute)": [[10, "gymnasium.vector.VectorEnv.num_envs", false]], "numpytotorch (class in gymnasium.wrappers)": [[17, "gymnasium.wrappers.NumpyToTorch", false]], "numpytotorch (class in gymnasium.wrappers.vector)": [[14, "gymnasium.wrappers.vector.NumpyToTorch", false]], "observation() (gymnasium.experimental.functional.funcenv method)": [[3, "gymnasium.experimental.functional.FuncEnv.observation", false]], "observation() (gymnasium.observationwrapper method)": [[18, "gymnasium.ObservationWrapper.observation", false]], "observation_space (gymnasium.env attribute)": [[2, "gymnasium.Env.observation_space", false]], "observation_space (gymnasium.vector.vectorenv attribute)": [[10, "gymnasium.vector.VectorEnv.observation_space", false]], "observation_space (gymnasium.wrapper property)": [[15, "gymnasium.Wrapper.observation_space", false]], "observations() (gymnasium.vector.vectorobservationwrapper method)": [[14, "gymnasium.vector.VectorObservationWrapper.observations", false]], "observationwrapper (class in gymnasium)": [[18, "gymnasium.ObservationWrapper", false]], "oneof (class in gymnasium.spaces)": [[6, "gymnasium.spaces.OneOf", false]], "orderenforcing (class in gymnasium.wrappers)": [[17, "gymnasium.wrappers.OrderEnforcing", false]], "parse_env_id() (in module gymnasium.envs.registration)": [[4, "gymnasium.envs.registration.parse_env_id", false]], "passiveenvchecker (class in gymnasium.wrappers)": [[17, "gymnasium.wrappers.PassiveEnvChecker", false]], "play() (in module gymnasium.utils.play)": [[9, "gymnasium.utils.play.play", false]], "playablegame (class in gymnasium.utils.play)": [[9, "gymnasium.utils.play.PlayableGame", false]], "playplot (class in gymnasium.utils.play)": [[9, "gymnasium.utils.play.PlayPlot", false]], "pprint_registry() (in module gymnasium)": [[4, "gymnasium.pprint_registry", false]], "process_event() (gymnasium.utils.play.playablegame method)": [[9, "gymnasium.utils.play.PlayableGame.process_event", false]], "read_from_shared_memory() (in module gymnasium.vector.utils)": [[13, "gymnasium.vector.utils.read_from_shared_memory", false]], "recordepisodestatistics (class in gymnasium.wrappers)": [[17, "gymnasium.wrappers.RecordEpisodeStatistics", false]], "recordepisodestatistics (class in gymnasium.wrappers.vector)": [[14, "gymnasium.wrappers.vector.RecordEpisodeStatistics", false]], "recordvideo (class in gymnasium.wrappers)": [[17, "gymnasium.wrappers.RecordVideo", false]], "register() (in module gymnasium)": [[4, "gymnasium.register", false]], "registry (gymnasium.envs.registration attribute)": [[4, "gymnasium.envs.registration.registry", false]], "render() (gymnasium.env method)": [[2, "gymnasium.Env.render", false]], "render() (gymnasium.envs.functional_jax_env.functionaljaxenv method)": [[3, "gymnasium.envs.functional_jax_env.FunctionalJaxEnv.render", false]], "render() (gymnasium.vector.vectorenv method)": [[10, "gymnasium.vector.VectorEnv.render", false]], "render() (gymnasium.vector.vectorwrapper method)": [[14, "gymnasium.vector.VectorWrapper.render", false]], "render() (gymnasium.wrapper method)": [[15, "gymnasium.Wrapper.render", false]], "render_close() (gymnasium.experimental.functional.funcenv method)": [[3, "gymnasium.experimental.functional.FuncEnv.render_close", false]], "render_image() (gymnasium.experimental.functional.funcenv method)": [[3, "gymnasium.experimental.functional.FuncEnv.render_image", false]], "render_init() (gymnasium.experimental.functional.funcenv method)": [[3, "gymnasium.experimental.functional.FuncEnv.render_init", false]], "render_mode (gymnasium.env attribute)": [[2, "gymnasium.Env.render_mode", false]], "render_mode (gymnasium.vector.vectorenv attribute)": [[10, "gymnasium.vector.VectorEnv.render_mode", false]], "rendercollection (class in gymnasium.wrappers)": [[17, "gymnasium.wrappers.RenderCollection", false]], "rescaleaction (class in gymnasium.wrappers)": [[16, "gymnasium.wrappers.RescaleAction", false]], "rescaleaction (class in gymnasium.wrappers.vector)": [[14, "gymnasium.wrappers.vector.RescaleAction", false]], "rescaleobservation (class in gymnasium.wrappers)": [[18, "gymnasium.wrappers.RescaleObservation", false]], "rescaleobservation (class in gymnasium.wrappers.vector)": [[14, "gymnasium.wrappers.vector.RescaleObservation", false]], "reset() (gymnasium.env method)": [[2, "gymnasium.Env.reset", false]], "reset() (gymnasium.envs.functional_jax_env.functionaljaxenv method)": [[3, "gymnasium.envs.functional_jax_env.FunctionalJaxEnv.reset", false]], "reset() (gymnasium.vector.asyncvectorenv method)": [[11, "gymnasium.vector.AsyncVectorEnv.reset", false]], "reset() (gymnasium.vector.syncvectorenv method)": [[12, "gymnasium.vector.SyncVectorEnv.reset", false]], "reset() (gymnasium.vector.vectorenv method)": [[10, "gymnasium.vector.VectorEnv.reset", false]], "reset() (gymnasium.vector.vectorwrapper method)": [[14, "gymnasium.vector.VectorWrapper.reset", false]], "reset() (gymnasium.wrapper method)": [[15, "gymnasium.Wrapper.reset", false]], "reshapeobservation (class in gymnasium.wrappers)": [[18, "gymnasium.wrappers.ReshapeObservation", false]], "reshapeobservation (class in gymnasium.wrappers.vector)": [[14, "gymnasium.wrappers.vector.ReshapeObservation", false]], "resizeobservation (class in gymnasium.wrappers)": [[18, "gymnasium.wrappers.ResizeObservation", false]], "resizeobservation (class in gymnasium.wrappers.vector)": [[14, "gymnasium.wrappers.vector.ResizeObservation", false]], "reward() (gymnasium.experimental.functional.funcenv method)": [[3, "gymnasium.experimental.functional.FuncEnv.reward", false]], "reward() (gymnasium.rewardwrapper method)": [[19, "gymnasium.RewardWrapper.reward", false]], "rewards() (gymnasium.vector.vectorrewardwrapper method)": [[14, "gymnasium.vector.VectorRewardWrapper.rewards", false]], "rewardwrapper (class in gymnasium)": [[19, "gymnasium.RewardWrapper", false]], "sample() (gymnasium.spaces.box method)": [[7, "gymnasium.spaces.Box.sample", false]], "sample() (gymnasium.spaces.dict method)": [[6, "gymnasium.spaces.Dict.sample", false]], "sample() (gymnasium.spaces.discrete method)": [[7, "gymnasium.spaces.Discrete.sample", false]], "sample() (gymnasium.spaces.graph method)": [[6, "gymnasium.spaces.Graph.sample", false]], "sample() (gymnasium.spaces.multibinary method)": [[7, "gymnasium.spaces.MultiBinary.sample", false]], "sample() (gymnasium.spaces.multidiscrete method)": [[7, "gymnasium.spaces.MultiDiscrete.sample", false]], "sample() (gymnasium.spaces.oneof method)": [[6, "gymnasium.spaces.OneOf.sample", false]], "sample() (gymnasium.spaces.sequence method)": [[6, "gymnasium.spaces.Sequence.sample", false]], "sample() (gymnasium.spaces.space method)": [[5, "gymnasium.spaces.Space.sample", false]], "sample() (gymnasium.spaces.text method)": [[7, "gymnasium.spaces.Text.sample", false]], "sample() (gymnasium.spaces.tuple method)": [[6, "gymnasium.spaces.Tuple.sample", false]], "save_video() (in module gymnasium.utils.save_video)": [[9, "gymnasium.utils.save_video.save_video", false]], "seed() (gymnasium.spaces.box method)": [[7, "gymnasium.spaces.Box.seed", false]], "seed() (gymnasium.spaces.dict method)": [[6, "gymnasium.spaces.Dict.seed", false]], "seed() (gymnasium.spaces.discrete method)": [[7, "gymnasium.spaces.Discrete.seed", false]], "seed() (gymnasium.spaces.graph method)": [[6, "gymnasium.spaces.Graph.seed", false]], "seed() (gymnasium.spaces.multibinary method)": [[7, "gymnasium.spaces.MultiBinary.seed", false]], "seed() (gymnasium.spaces.multidiscrete method)": [[7, "gymnasium.spaces.MultiDiscrete.seed", false]], "seed() (gymnasium.spaces.oneof method)": [[6, "gymnasium.spaces.OneOf.seed", false]], "seed() (gymnasium.spaces.sequence method)": [[6, "gymnasium.spaces.Sequence.seed", false]], "seed() (gymnasium.spaces.space method)": [[5, "gymnasium.spaces.Space.seed", false]], "seed() (gymnasium.spaces.text method)": [[7, "gymnasium.spaces.Text.seed", false]], "seed() (gymnasium.spaces.tuple method)": [[6, "gymnasium.spaces.Tuple.seed", false]], "sequence (class in gymnasium.spaces)": [[6, "gymnasium.spaces.Sequence", false]], "set_attr() (gymnasium.vector.asyncvectorenv method)": [[11, "gymnasium.vector.AsyncVectorEnv.set_attr", false]], "set_attr() (gymnasium.vector.syncvectorenv method)": [[12, "gymnasium.vector.SyncVectorEnv.set_attr", false]], "set_wrapper_attr() (gymnasium.wrapper method)": [[15, "gymnasium.Wrapper.set_wrapper_attr", false]], "shape (gymnasium.spaces.space property)": [[5, "gymnasium.spaces.Space.shape", false]], "single_action_space (gymnasium.vector.vectorenv attribute)": [[10, "gymnasium.vector.VectorEnv.single_action_space", false]], "single_observation_space (gymnasium.vector.vectorenv attribute)": [[10, "gymnasium.vector.VectorEnv.single_observation_space", false]], "space (class in gymnasium.spaces)": [[5, "gymnasium.spaces.Space", false]], "spec (gymnasium.env attribute)": [[2, "gymnasium.Env.spec", false]], "spec (gymnasium.vector.vectorenv attribute)": [[10, "gymnasium.vector.VectorEnv.spec", false]], "spec (gymnasium.wrapper property)": [[15, "gymnasium.Wrapper.spec", false]], "spec() (in module gymnasium)": [[4, "gymnasium.spec", false]], "state_info() (gymnasium.experimental.functional.funcenv method)": [[3, "gymnasium.experimental.functional.FuncEnv.state_info", false]], "step() (gymnasium.env method)": [[2, "gymnasium.Env.step", false]], "step() (gymnasium.envs.functional_jax_env.functionaljaxenv method)": [[3, "gymnasium.envs.functional_jax_env.FunctionalJaxEnv.step", false]], "step() (gymnasium.vector.asyncvectorenv method)": [[11, "gymnasium.vector.AsyncVectorEnv.step", false]], "step() (gymnasium.vector.syncvectorenv method)": [[12, "gymnasium.vector.SyncVectorEnv.step", false]], "step() (gymnasium.vector.vectorenv method)": [[10, "gymnasium.vector.VectorEnv.step", false]], "step() (gymnasium.vector.vectorwrapper method)": [[14, "gymnasium.vector.VectorWrapper.step", false]], "step() (gymnasium.wrapper method)": [[15, "gymnasium.Wrapper.step", false]], "step_api_compatibility() (in module gymnasium.utils.step_api_compatibility)": [[9, "gymnasium.utils.step_api_compatibility.step_api_compatibility", false]], "stickyaction (class in gymnasium.wrappers)": [[16, "gymnasium.wrappers.StickyAction", false]], "syncvectorenv (class in gymnasium.vector)": [[12, "gymnasium.vector.SyncVectorEnv", false]], "terminal() (gymnasium.experimental.functional.funcenv method)": [[3, "gymnasium.experimental.functional.FuncEnv.terminal", false]], "text (class in gymnasium.spaces)": [[7, "gymnasium.spaces.Text", false]], "timeawareobservation (class in gymnasium.wrappers)": [[18, "gymnasium.wrappers.TimeAwareObservation", false]], "timelimit (class in gymnasium.wrappers)": [[17, "gymnasium.wrappers.TimeLimit", false]], "to_jsonable() (gymnasium.spaces.space method)": [[5, "gymnasium.spaces.Space.to_jsonable", false]], "transform() (gymnasium.experimental.functional.funcenv method)": [[3, "gymnasium.experimental.functional.FuncEnv.transform", false]], "transformaction (class in gymnasium.wrappers)": [[16, "gymnasium.wrappers.TransformAction", false]], "transformaction (class in gymnasium.wrappers.vector)": [[14, "gymnasium.wrappers.vector.TransformAction", false]], "transformobservation (class in gymnasium.wrappers)": [[18, "gymnasium.wrappers.TransformObservation", false]], "transformobservation (class in gymnasium.wrappers.vector)": [[14, "gymnasium.wrappers.vector.TransformObservation", false]], "transformreward (class in gymnasium.wrappers)": [[19, "gymnasium.wrappers.TransformReward", false]], "transformreward (class in gymnasium.wrappers.vector)": [[14, "gymnasium.wrappers.vector.TransformReward", false]], "transition() (gymnasium.experimental.functional.funcenv method)": [[3, "gymnasium.experimental.functional.FuncEnv.transition", false]], "transition_info() (gymnasium.experimental.functional.funcenv method)": [[3, "gymnasium.experimental.functional.FuncEnv.transition_info", false]], "tuple (class in gymnasium.spaces)": [[6, "gymnasium.spaces.Tuple", false]], "unflatten() (in module gymnasium.spaces.utils)": [[8, "gymnasium.spaces.utils.unflatten", false]], "unwrapped (gymnasium.env property)": [[2, "gymnasium.Env.unwrapped", false]], "unwrapped (gymnasium.vector.vectorenv property)": [[10, "gymnasium.vector.VectorEnv.unwrapped", false]], "unwrapped (gymnasium.wrapper property)": [[15, "gymnasium.Wrapper.unwrapped", false]], "vectoractionwrapper (class in gymnasium.vector)": [[14, "gymnasium.vector.VectorActionWrapper", false]], "vectorenv (class in gymnasium.vector)": [[10, "gymnasium.vector.VectorEnv", false]], "vectorizetransformaction (class in gymnasium.wrappers.vector)": [[14, "gymnasium.wrappers.vector.VectorizeTransformAction", false]], "vectorizetransformobservation (class in gymnasium.wrappers.vector)": [[14, "gymnasium.wrappers.vector.VectorizeTransformObservation", false]], "vectorizetransformreward (class in gymnasium.wrappers.vector)": [[14, "gymnasium.wrappers.vector.VectorizeTransformReward", false]], "vectorobservationwrapper (class in gymnasium.vector)": [[14, "gymnasium.vector.VectorObservationWrapper", false]], "vectorrewardwrapper (class in gymnasium.vector)": [[14, "gymnasium.vector.VectorRewardWrapper", false]], "vectorwrapper (class in gymnasium.vector)": [[14, "gymnasium.vector.VectorWrapper", false]], "wrapper (class in gymnasium)": [[15, "gymnasium.Wrapper", false]], "wrapper_spec() (gymnasium.wrapper class method)": [[15, "gymnasium.Wrapper.wrapper_spec", false]], "wrapperspec (class in gymnasium.envs.registration)": [[4, "gymnasium.envs.registration.WrapperSpec", false]], "write_to_shared_memory() (in module gymnasium.vector.utils)": [[13, "gymnasium.vector.utils.write_to_shared_memory", false]]}, "objects": {"gymnasium": [[16, 0, 1, "", "ActionWrapper"], [2, 0, 1, "", "Env"], [18, 0, 1, "", "ObservationWrapper"], [19, 0, 1, "", "RewardWrapper"], [15, 0, 1, "", "Wrapper"], [4, 4, 1, "", "make"], [4, 4, 1, "", "make_vec"], [4, 4, 1, "", "pprint_registry"], [4, 4, 1, "", "register"], [5, 5, 0, "-", "spaces"], [4, 4, 1, "", "spec"], [15, 5, 0, "-", "wrappers"]], "gymnasium.ActionWrapper": [[16, 1, 1, "", "action"]], "gymnasium.Env": [[2, 2, 1, "", "action_space"], [2, 1, 1, "", "close"], [2, 2, 1, "", "metadata"], [2, 3, 1, "", "np_random"], [2, 3, 1, "", "np_random_seed"], [2, 2, 1, "", "observation_space"], [2, 1, 1, "", "render"], [2, 2, 1, "", "render_mode"], [2, 1, 1, "", "reset"], [2, 2, 1, "", "spec"], [2, 1, 1, "", "step"], [2, 3, 1, "", "unwrapped"]], "gymnasium.ObservationWrapper": [[18, 1, 1, "", "observation"]], "gymnasium.RewardWrapper": [[19, 1, 1, "", "reward"]], "gymnasium.Wrapper": [[15, 3, 1, "", "action_space"], [15, 1, 1, "", "close"], [15, 2, 1, "", "env"], [15, 1, 1, "", "get_wrapper_attr"], [15, 3, 1, "", "metadata"], [15, 3, 1, "", "np_random"], [15, 3, 1, "", "np_random_seed"], [15, 3, 1, "", "observation_space"], [15, 1, 1, "", "render"], [15, 1, 1, "", "reset"], [15, 1, 1, "", "set_wrapper_attr"], [15, 3, 1, "", "spec"], [15, 1, 1, "", "step"], [15, 3, 1, "", "unwrapped"], [15, 1, 1, "", "wrapper_spec"]], "gymnasium.envs.functional_jax_env": [[3, 0, 1, "", "FunctionalJaxEnv"]], "gymnasium.envs.functional_jax_env.FunctionalJaxEnv": [[3, 1, 1, "", "render"], [3, 1, 1, "", "reset"], [3, 1, 1, "", "step"]], "gymnasium.envs.registration": [[4, 0, 1, "", "EnvSpec"], [4, 0, 1, "", "WrapperSpec"], [4, 2, 1, "", "current_namespace"], [4, 4, 1, "", "find_highest_version"], [4, 4, 1, "", "get_env_id"], [4, 4, 1, "", "load_env_creator"], [4, 4, 1, "", "namespace"], [4, 4, 1, "", "parse_env_id"], [4, 2, 1, "", "registry"]], "gymnasium.experimental.functional": [[3, 0, 1, "", "FuncEnv"]], "gymnasium.experimental.functional.FuncEnv": [[3, 1, 1, "", "initial"], [3, 1, 1, "", "observation"], [3, 1, 1, "", "render_close"], [3, 1, 1, "", "render_image"], [3, 1, 1, "", "render_init"], [3, 1, 1, "", "reward"], [3, 1, 1, "", "state_info"], [3, 1, 1, "", "terminal"], [3, 1, 1, "", "transform"], [3, 1, 1, "", "transition"], [3, 1, 1, "", "transition_info"]], "gymnasium.spaces": [[7, 0, 1, "", "Box"], [6, 0, 1, "", "Dict"], [7, 0, 1, "", "Discrete"], [6, 0, 1, "", "Graph"], [7, 0, 1, "", "MultiBinary"], [7, 0, 1, "", "MultiDiscrete"], [6, 0, 1, "", "OneOf"], [6, 0, 1, "", "Sequence"], [5, 0, 1, "", "Space"], [7, 0, 1, "", "Text"], [6, 0, 1, "", "Tuple"]], "gymnasium.spaces.Box": [[7, 1, 1, "", "is_bounded"], [7, 1, 1, "", "sample"], [7, 1, 1, "", "seed"]], "gymnasium.spaces.Dict": [[6, 1, 1, "", "sample"], [6, 1, 1, "", "seed"]], "gymnasium.spaces.Discrete": [[7, 1, 1, "", "sample"], [7, 1, 1, "", "seed"]], "gymnasium.spaces.Graph": [[6, 1, 1, "", "sample"], [6, 1, 1, "", "seed"]], "gymnasium.spaces.MultiBinary": [[7, 1, 1, "", "sample"], [7, 1, 1, "", "seed"]], "gymnasium.spaces.MultiDiscrete": [[7, 1, 1, "", "sample"], [7, 1, 1, "", "seed"]], "gymnasium.spaces.OneOf": [[6, 1, 1, "", "sample"], [6, 1, 1, "", "seed"]], "gymnasium.spaces.Sequence": [[6, 1, 1, "", "sample"], [6, 1, 1, "", "seed"]], "gymnasium.spaces.Space": [[5, 1, 1, "", "contains"], [5, 3, 1, "", "dtype"], [5, 1, 1, "", "from_jsonable"], [5, 3, 1, "", "is_np_flattenable"], [5, 3, 1, "", "np_random"], [5, 1, 1, "", "sample"], [5, 1, 1, "", "seed"], [5, 3, 1, "", "shape"], [5, 1, 1, "", "to_jsonable"]], "gymnasium.spaces.Text": [[7, 1, 1, "", "sample"], [7, 1, 1, "", "seed"]], "gymnasium.spaces.Tuple": [[6, 1, 1, "", "sample"], [6, 1, 1, "", "seed"]], "gymnasium.spaces.utils": [[8, 4, 1, "", "flatdim"], [8, 4, 1, "", "flatten"], [8, 4, 1, "", "flatten_space"], [8, 4, 1, "", "unflatten"]], "gymnasium.utils.env_checker": [[9, 4, 1, "", "check_env"]], "gymnasium.utils.ezpickle": [[9, 0, 1, "", "EzPickle"]], "gymnasium.utils.performance": [[9, 4, 1, "", "benchmark_init"], [9, 4, 1, "", "benchmark_render"], [9, 4, 1, "", "benchmark_step"]], "gymnasium.utils.play": [[9, 0, 1, "", "PlayPlot"], [9, 0, 1, "", "PlayableGame"], [9, 4, 1, "", "play"]], "gymnasium.utils.play.PlayPlot": [[9, 1, 1, "", "callback"]], "gymnasium.utils.play.PlayableGame": [[9, 1, 1, "", "process_event"]], "gymnasium.utils.save_video": [[9, 4, 1, "", "capped_cubic_video_schedule"], [9, 4, 1, "", "save_video"]], "gymnasium.utils.seeding": [[9, 4, 1, "", "np_random"]], "gymnasium.utils.step_api_compatibility": [[9, 4, 1, "", "convert_to_done_step_api"], [9, 4, 1, "", "convert_to_terminated_truncated_step_api"], [9, 4, 1, "", "step_api_compatibility"]], "gymnasium.vector": [[11, 0, 1, "", "AsyncVectorEnv"], [12, 0, 1, "", "SyncVectorEnv"], [14, 0, 1, "", "VectorActionWrapper"], [10, 0, 1, "", "VectorEnv"], [14, 0, 1, "", "VectorObservationWrapper"], [14, 0, 1, "", "VectorRewardWrapper"], [14, 0, 1, "", "VectorWrapper"]], "gymnasium.vector.AsyncVectorEnv": [[11, 1, 1, "", "call"], [11, 1, 1, "", "close"], [11, 1, 1, "", "get_attr"], [11, 3, 1, "", "np_random"], [11, 3, 1, "", "np_random_seed"], [11, 1, 1, "", "reset"], [11, 1, 1, "", "set_attr"], [11, 1, 1, "", "step"]], "gymnasium.vector.SyncVectorEnv": [[12, 1, 1, "", "call"], [12, 1, 1, "", "close"], [12, 1, 1, "", "get_attr"], [12, 3, 1, "", "np_random"], [12, 3, 1, "", "np_random_seed"], [12, 1, 1, "", "reset"], [12, 1, 1, "", "set_attr"], [12, 1, 1, "", "step"]], "gymnasium.vector.VectorActionWrapper": [[14, 1, 1, "", "actions"]], "gymnasium.vector.VectorEnv": [[10, 2, 1, "", "action_space"], [10, 1, 1, "", "close"], [10, 2, 1, "", "closed"], [10, 2, 1, "", "metadata"], [10, 3, 1, "", "np_random"], [10, 3, 1, "", "np_random_seed"], [10, 2, 1, "", "num_envs"], [10, 2, 1, "", "observation_space"], [10, 1, 1, "", "render"], [10, 2, 1, "", "render_mode"], [10, 1, 1, "", "reset"], [10, 2, 1, "", "single_action_space"], [10, 2, 1, "", "single_observation_space"], [10, 2, 1, "", "spec"], [10, 1, 1, "", "step"], [10, 3, 1, "", "unwrapped"]], "gymnasium.vector.VectorObservationWrapper": [[14, 1, 1, "", "observations"]], "gymnasium.vector.VectorRewardWrapper": [[14, 1, 1, "", "rewards"]], "gymnasium.vector.VectorWrapper": [[14, 1, 1, "", "close"], [14, 1, 1, "", "render"], [14, 1, 1, "", "reset"], [14, 1, 1, "", "step"]], "gymnasium.vector.utils": [[13, 4, 1, "", "CloudpickleWrapper"], [13, 4, 1, "", "batch_space"], [13, 4, 1, "", "clear_mpi_env_vars"], [13, 4, 1, "", "concatenate"], [13, 4, 1, "", "create_empty_array"], [13, 4, 1, "", "create_shared_memory"], [13, 4, 1, "", "iterate"], [13, 4, 1, "", "read_from_shared_memory"], [13, 4, 1, "", "write_to_shared_memory"]], "gymnasium.wrappers": [[18, 0, 1, "", "AddRenderObservation"], [17, 0, 1, "", "ArrayConversion"], [17, 0, 1, "", "AtariPreprocessing"], [17, 0, 1, "", "Autoreset"], [16, 0, 1, "", "ClipAction"], [19, 0, 1, "", "ClipReward"], [18, 0, 1, "", "DelayObservation"], [18, 0, 1, "", "DtypeObservation"], [18, 0, 1, "", "FilterObservation"], [18, 0, 1, "", "FlattenObservation"], [18, 0, 1, "", "FrameStackObservation"], [18, 0, 1, "", "GrayscaleObservation"], [17, 0, 1, "", "HumanRendering"], [17, 0, 1, "", "JaxToNumpy"], [17, 0, 1, "", "JaxToTorch"], [18, 0, 1, "", "MaxAndSkipObservation"], [18, 0, 1, "", "NormalizeObservation"], [19, 0, 1, "", "NormalizeReward"], [17, 0, 1, "", "NumpyToTorch"], [17, 0, 1, "", "OrderEnforcing"], [17, 0, 1, "", "PassiveEnvChecker"], [17, 0, 1, "", "RecordEpisodeStatistics"], [17, 0, 1, "", "RecordVideo"], [17, 0, 1, "", "RenderCollection"], [16, 0, 1, "", "RescaleAction"], [18, 0, 1, "", "RescaleObservation"], [18, 0, 1, "", "ReshapeObservation"], [18, 0, 1, "", "ResizeObservation"], [16, 0, 1, "", "StickyAction"], [18, 0, 1, "", "TimeAwareObservation"], [17, 0, 1, "", "TimeLimit"], [16, 0, 1, "", "TransformAction"], [18, 0, 1, "", "TransformObservation"], [19, 0, 1, "", "TransformReward"]], "gymnasium.wrappers.vector": [[14, 0, 1, "", "ArrayConversion"], [14, 0, 1, "", "ClipAction"], [14, 0, 1, "", "ClipReward"], [14, 0, 1, "", "DictInfoToList"], [14, 0, 1, "", "DtypeObservation"], [14, 0, 1, "", "FilterObservation"], [14, 0, 1, "", "FlattenObservation"], [14, 0, 1, "", "GrayscaleObservation"], [14, 0, 1, "", "JaxToNumpy"], [14, 0, 1, "", "JaxToTorch"], [14, 0, 1, "", "NormalizeObservation"], [14, 0, 1, "", "NormalizeReward"], [14, 0, 1, "", "NumpyToTorch"], [14, 0, 1, "", "RecordEpisodeStatistics"], [14, 0, 1, "", "RescaleAction"], [14, 0, 1, "", "RescaleObservation"], [14, 0, 1, "", "ReshapeObservation"], [14, 0, 1, "", "ResizeObservation"], [14, 0, 1, "", "TransformAction"], [14, 0, 1, "", "TransformObservation"], [14, 0, 1, "", "TransformReward"], [14, 0, 1, "", "VectorizeTransformAction"], [14, 0, 1, "", "VectorizeTransformObservation"], [14, 0, 1, "", "VectorizeTransformReward"]]}, "objnames": {"0": ["py", "class", "Python class"], "1": ["py", "method", "Python method"], "2": ["py", "attribute", "Python attribute"], "3": ["py", "property", "Python property"], "4": ["py", "function", "Python function"], "5": ["py", "module", "Python module"]}, "objtypes": {"0": "py:class", "1": "py:method", "2": "py:attribute", "3": "py:property", "4": "py:function", "5": "py:module"}, "terms": {"": [1, 2, 3, 5, 6, 7, 9, 10, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 126, 127, 128, 129, 130, 131, 133, 134, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 149, 150, 151, 152, 153, 154, 155, 156, 157, 158, 159, 161, 163, 165, 166, 167, 169, 173, 174, 175, 177, 178], "0": [2, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 127, 128, 129, 131, 132, 133, 134, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 150, 151, 152, 153, 154, 158, 159, 161, 163, 165, 166, 167, 173, 174, 175, 177, 178], "00": [2, 10, 18], "000": 163, "00000000e": [10, 18], "00048403": 14, "000635": [10, 14], "00080468": 14, "0008876301247721108": 19, "001": [133, 135, 140, 163, 174, 178], "00105192": 14, "00127": 14, "00133522": 14, "00142543": 14, "0015": 134, "002": [18, 139, 147, 169], "00209899": 14, "00214607": 11, "0025": [133, 134], "00266526": 14, "003": 140, "00372536": 14, "00395268": 14, "005": [144, 145, 178], "00529102": 14, "00545912": 14, "0059888": 18, "00611216": [10, 18], "00614867": 14, "00615723": 14, "00624371": 14, "00708": 6, "00711833": 6, "00715587": 14, "007812": 14, "008": [139, 147], "00848456": 10, "00942293": 10, "00987654": 158, "01": [2, 10, 14, 16, 18, 129, 137, 138, 141, 142, 143, 144, 145, 146, 155, 156, 159, 163, 169, 174, 178], "010162116476634746": 19, "01098382": [10, 14], "01162461": 10, "01234567": 158, "0123456789": 7, "0123456789abcdefghijklmnopqrstuvwxyzabcdefghijklmnopqrstuvwxyz": 7, "01431748": 10, "01456789": 158, "015": 140, "01522993": 10, "01734283": [10, 16], "01823519": [10, 14, 16, 18], "0197368": [10, 18], "02": [10, 18, 145, 155, 156, 163], "0203607": 16, "0219676": 14, "02345678": 158, "02418869": 10, "024251968": 14, "02438": 178, "02480598": [10, 14], "02727336": [10, 18], "02728892": 16, "0273956": [10, 18], "02796401": [10, 14, 16, 18], "02852531": [10, 14], "02858594": [10, 14], "02859527": [10, 16], "029028230434438706": 14, "02909703": 10, "03": [14, 129, 155, 156], "03156282": [10, 14, 16, 18], "03203924": [10, 14], "0333221090036294": 14, "03332211": 14, "03359492141887935": 14, "03392126": 10, "03516225": 10, "03517495": [10, 14], "03525399": 16, "03585979": [10, 18], "03625453": [10, 18], "03647037": 132, "03774345": 10, "03812904": 16, "03822722": 10, "04": [14, 16, 146, 155], "0446179": [10, 14, 16, 18], "04562247": 10, "0469136": [10, 14], "0469184": 10, "04731862": 10, "04740972": 10, "04794393": 16, "04799704": 10, "05": [14, 132, 137, 138, 141, 144, 155, 156, 163, 169], "055928": 14, "05592803": 132, "06": [155, 156], "06296527": 14, "06296527291998574": 14, "0631256": 14, "06312564": 132, "0640786": 14, "06540678": 18, "06670535": 16, "07": [133, 134, 155, 156], "07287608": 131, "07422512": 18, "08": [155, 156], "0808398": 11, "08227695": 18, "0892358": [14, 132], "09": [155, 156], "09417735": 13, "09613613": 18, "0_": [137, 138, 142, 144], "0_2": [144, 145], "0_3": 144, "0a2": 132, "0th": 17, "0x7f04efcb8850": 158, "0x7fbb5efd0490": 15, "1": [2, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 127, 128, 129, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 150, 151, 152, 153, 154, 158, 159, 161, 163, 165, 166, 167, 173, 174, 175, 177, 178], "10": [6, 7, 14, 17, 18, 127, 129, 135, 137, 138, 139, 140, 141, 142, 144, 145, 146, 147, 150, 151, 152, 154, 155, 156, 158, 159, 160, 161, 163, 165, 174, 177, 178], "100": [6, 8, 14, 17, 127, 128, 129, 131, 134, 139, 144, 148, 151, 152, 153, 161, 163, 169, 173], "1000": [9, 17, 128, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 157, 161, 163, 169, 177, 178], "1006": 156, "1009": 156, "100_000": [163, 174], "1013": 156, "10172354684460168": 14, "10172355": 14, "1018": 156, "1019": 156, "1027": 156, "1033": 156, "105": [137, 156], "107": 137, "1075": 156, "1086": 156, "1087": 156, "1094": 156, "1095": 156, "10_000": 161, "10th": 160, "10x": 174, "11": [14, 137, 138, 139, 140, 141, 144, 147, 150, 151, 152, 155, 174, 178], "110": 156, "1105": 156, "1107": 156, "1109": 156, "11185605": 131, "1119": 156, "112": 156, "1120": 156, "11448676": 14, "117": 156, "12": [8, 16, 17, 18, 129, 131, 132, 137, 138, 139, 140, 141, 144, 147, 151, 152, 156, 163, 173, 174, 178], "120": 178, "12224312": [11, 12], "1229": 156, "123": [2, 6, 10, 11, 14, 16, 17, 18, 19, 131, 132, 133, 134, 135, 156, 160, 175], "1230": 156, "124": 156, "1240": 156, "1243": 156, "125": 156, "1250": 156, "1253": 156, "125637": 6, "1260": 156, "12625128": 131, "1264": 156, "1271": 156, "128": 178, "1280": 136, "1283": 156, "1285": 156, "1288": 156, "1289": 156, "1291": 156, "1293": 156, "1294": 156, "1297": 156, "1299": 156, "13": [137, 138, 140, 141, 144, 147, 154, 155, 156], "130": [140, 141, 156], "1304": 156, "1306": 156, "1308": 156, "1310": 156, "1312": 156, "1315": 156, "1319": 156, "132": [151, 152, 156], "1328": 156, "1329": 156, "1333": 156, "1334": 156, "136": 156, "1361": 156, "1378": 156, "138": 156, "1387": 156, "139": 156, "1393": 156, "1396": 156, "14": [137, 138, 140, 141, 144, 147, 155, 156, 174], "141": 156, "1415927": 127, "143": 156, "145": 137, "1455": 17, "146": 156, "14995256": [11, 12], "15": [8, 16, 17, 18, 19, 129, 137, 138, 140, 141, 144, 147, 153, 161, 175, 178], "150": [9, 173], "1500": 155, "1506": 178, "15089367": [10, 16], "1511158": 18, "155": 156, "1598639586606745": 14, "16": [135, 137, 138, 140, 141, 144, 147, 153, 155, 156, 174, 177], "160": 156, "1600": 127, "1613": 154, "164": 156, "16717631": 10, "17": [137, 138, 140, 141, 144, 147, 150, 155], "17032": 156, "171": 156, "1710671": 10, "172": 156, "173": 156, "174": 156, "17752565": 131, "178": 156, "179": 156, "18": [18, 137, 138, 140, 141, 144, 147, 155], "1800": 175, "183": 156, "184": 156, "1851753": 11, "186": 156, "1878752": 12, "18847767": 10, "18879032e": [10, 18], "1887903e": 2, "18933342": 6, "19": [137, 140, 141, 144, 178], "190": 156, "19049619": 6, "1938739": 14, "195": [156, 169], "19559774": 10, "199": 9, "1990": [133, 134], "1995": 131, "1996": 131, "1_": 145, "1b15": 155, "1d": [158, 159, 177], "1e": [14, 18, 19, 139, 140, 141, 146, 147, 177], "1f": 161, "2": [2, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 16, 17, 18, 19, 128, 129, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 150, 151, 152, 153, 154, 158, 159, 161, 163, 165, 166, 167, 173, 174, 175, 177, 178], "20": [129, 137, 140, 141, 144, 154, 156, 174, 175, 178], "200": [9, 17, 129, 131, 132, 133, 135, 153, 154, 156, 161], "2000": [9, 127, 154, 175], "2004": 177, "200th": 17, "2014": 128, "2016": 178, "2017": 155, "20172954": 18, "2018": [16, 17, 131, 155], "2019": 155, "2020": [148, 150, 151, 152], "2021": [136, 148, 155], "2022": [136, 155, 156], "2023": 156, "2024": 156, "2025": 156, "205": 156, "206": 156, "208": 156, "20946532": 14, "2095": 132, "21": [18, 19, 137, 140, 141, 144, 150, 156, 163, 174, 178], "210x180": 17, "215": 156, "216": 156, "21649833": 6, "218": 156, "219": 156, "21944423": 14, "22": [17, 137, 140, 141, 144, 156, 174], "220": 174, "221": 156, "223": 156, "224": 156, "225": 156, "227": 154, "229": 177, "23": [137, 140, 141, 144, 156, 161], "230": 156, "234": 156, "235": 156, "235794": 6, "2359734": 14, "238": 156, "24": [14, 17, 18, 127, 128, 129, 132, 137, 140, 141, 156, 174], "24002443": 10, "2407": 156, "241": 156, "244": 156, "24503504": 14, "2456": 155, "246": 156, "247": 156, "2487226": 10, "249": 156, "25": [2, 8, 10, 17, 19, 137, 139, 140, 141, 147, 154, 156, 161, 169], "250": [156, 161], "250th": 161, "252": 156, "2524": 155, "254": 156, "255": [17, 18, 128, 156, 165], "25533703": 18, "256": 177, "257": 156, "25715804": 10, "258": 156, "259": 156, "25g": 137, "26": [2, 17, 137, 140, 141, 166, 177], "26141977": 10, "264": 156, "264d": 169, "267": 156, "2671": 155, "2678": 155, "268": 156, "2684": 155, "27": [9, 19, 140, 141], "270": 156, "272": 156, "2736044": 135, "274": [131, 156], "274334": 131, "27648": [14, 18, 158], "277": 156, "278": 156, "27800309628058434": 14, "279": 156, "28": [14, 131, 140, 141], "281": 156, "282": 156, "2831855": 129, "284": 156, "29": [17, 140, 141, 155, 161], "2906": 155, "292": 156, "2d": [136, 145, 148, 159, 167], "2f": 161, "2gb": 155, "3": [2, 4, 5, 6, 7, 8, 9, 10, 12, 13, 14, 15, 16, 17, 18, 19, 127, 128, 129, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 150, 151, 152, 153, 154, 158, 159, 161, 163, 165, 173, 174, 175, 177, 178], "30": [2, 9, 17, 140, 141, 154, 156], "300": [127, 154, 159, 165, 175], "3000": 9, "3016": 155, "303": 154, "3034542e": 14, "3036": 155, "3037": 155, "304": 156, "3040": 155, "3041": 155, "3044": 155, "3072": 155, "30759571": 169, "3076": 155, "3080": 155, "3083": 155, "31": [140, 141, 156], "3110827": 10, "3118435e": 14, "3152": 19, "3154": 19, "32": [18, 140, 141, 150, 177, 178], "321": 156, "323": [144, 156], "32351476": 18, "327": [137, 156], "329": 156, "33": [140, 141], "330": 156, "331": 156, "3319138": 10, "332": 156, "33293587": [10, 16], "333": 156, "337": 156, "338": 156, "339": 156, "34": [140, 141], "340": 156, "341": 156, "342": 156, "34641072": 16, "34756234": 16, "348": [140, 141], "35": [140, 141, 156], "350": [140, 141], "355": 156, "36": [6, 140, 141, 151, 152], "37": [140, 141, 156], "373": 156, "38": [140, 141], "39": [140, 141, 156], "3991573": 6, "3d": [136, 137, 140, 141, 148, 159, 174], "3f": 163, "3rd": 136, "3v3": 148, "4": [2, 6, 7, 8, 9, 10, 14, 16, 17, 18, 127, 128, 129, 131, 132, 133, 134, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 150, 151, 152, 153, 154, 156, 158, 159, 161, 163, 165, 167, 173, 174, 177], "40": [140, 141], "400": [18, 154], "403": 156, "404": [154, 156], "405": 156, "407": 156, "41": [140, 141, 156], "4123625": 135, "418": [132, 156, 158], "41887903": [10, 18, 132], "4189": 6, "42": [6, 7, 10, 11, 12, 13, 16, 18, 140, 141, 156, 157, 159, 160, 163, 178], "424": 156, "42683297": 14, "42884544": 14, "429": 156, "43": [140, 141, 163], "433": 156, "435": 156, "4351738": 14, "4354835e": 14, "43887845": 13, "44": [6, 140, 141], "440": 156, "444": 156, "44504836": 14, "44799727": 14, "4488689e": 14, "45": [134, 144, 163], "450": 156, "451": 156, "459": 156, "4624777": 14, "46352962": [14, 133], "46515748": 14, "46543318": 14, "46546045": 14, "46553135": 14, "47": [151, 152], "47037": 6, "47377947": 14, "474": 156, "47599354": 14, "47de": 169, "48": [151, 152, 163], "480": 136, "4808415e": 16, "482": 156, "48468155": 14, "48657528": 14, "487": 156, "49": 163, "491": 156, "495": 156, "497": 156, "498371": 14, "4x12": [151, 152], "4x4": 153, "4\u03c0": 131, "5": [6, 7, 8, 9, 10, 13, 14, 16, 17, 18, 19, 127, 128, 129, 131, 133, 134, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 150, 154, 159, 163, 165, 173, 174, 175, 177, 178], "50": [17, 129, 137, 138, 139, 140, 141, 142, 144, 145, 146, 147, 163, 177], "500": [17, 18, 131, 132, 154, 155, 158, 161, 163, 174, 178], "5000": 173, "503": 156, "51": [6, 156], "510": 156, "512": [156, 165], "515": 156, "516": 156, "518": 156, "520": 156, "522": 156, "524": 156, "525": 156, "5281": 156, "529": 156, "533": 156, "5342437e": 14, "535": 156, "536": 156, "538": 156, "54": 6, "540": 156, "5420062": 16, "548": 156, "55": [6, 156], "553": 156, "554": 156, "557": 156, "558": 156, "561": 156, "5635296": 134, "564": 156, "566371": 131, "567": 131, "5676788": 18, "569": 156, "57": 178, "572": 156, "573": 156, "576": 156, "5760367": [11, 12], "58": 156, "580": 156, "581": 156, "583": 156, "5836242": 6, "588": 156, "589": 156, "58922320": 173, "590": 156, "594091": 6, "5e": [137, 139, 140, 141, 147, 169], "5e3": 177, "5gb": 155, "5x": 156, "5x5": [154, 159], "6": [8, 14, 16, 17, 18, 129, 131, 133, 134, 135, 137, 138, 139, 140, 141, 142, 144, 145, 146, 147, 151, 152, 154, 156, 161, 173, 177], "60": [8, 156], "600": [18, 178], "604": 156, "608": 156, "61": 156, "6102389": 12, "612": 156, "6120394": 18, "616": 156, "6193494": 11, "62": [6, 11, 12], "62259156": 14, "63": [6, 7], "63214064": 6, "634": 156, "6343064e": 14, "6344974": 16, "635": 156, "6382770e": 16, "639": 154, "6397772e": 16, "64": [6, 156], "6608303": 16, "666": 129, "669": 6, "67": 161, "6822636": 6, "683": 156, "68512": 6, "695": 156, "697368": 13, "6fn5ja9uzquzxgkvpwtqjz1eyjcs3hj3": 169, "7": [7, 9, 129, 134, 135, 137, 138, 139, 140, 141, 142, 144, 145, 146, 147, 148, 156, 169, 178], "70": 156, "708": 156, "709": 156, "714599": 11, "7183299": 18, "72": 156, "720": 136, "7257502": 6, "729": 9, "73": 156, "731": 156, "732": 128, "74": 156, "748": 156, "75": [16, 137, 169], "75cm": 137, "76": 161, "7619033": 14, "762": 156, "7695615": 12, "77": 6, "77395606": 13, "774": 156, "78": [137, 140, 141, 156, 161], "7851154": 11, "788": 156, "789": 156, "791": 156, "79221743": 12, "8": [6, 9, 10, 14, 18, 19, 128, 129, 131, 132, 135, 137, 138, 139, 140, 141, 142, 144, 145, 146, 147, 153, 155, 156, 158, 159, 173, 175, 177, 178], "80": [153, 154], "800": [156, 175], "8000": 1, "80000019": [10, 18], "80000019e": [10, 18], "8000002e": 2, "801": 156, "81": [11, 12, 135, 156], "810": 156, "811": 156, "812": 156, "8127025": 156, "8127026": 156, "817": 156, "8174238": [11, 12], "81882": 6, "827": 156, "83": 156, "830": 156, "83506": 6, "838": 156, "84": [6, 17], "8498053": 12, "84x84": 17, "85859793": 13, "867": 156, "886": 156, "889": 156, "88g": 137, "89": [6, 156], "8914354": 18, "89235795": 135, "893": 156, "89345848": 14, "8934584807363618": 14, "8971417e": 14, "898": 156, "8f1d43620bc6bb580df6e80b0dc05c48": 131, "8gb": 155, "8x8": 153, "9": [11, 12, 14, 16, 131, 135, 137, 138, 139, 140, 141, 142, 144, 145, 147, 156, 174, 178], "90": 174, "9053838": 6, "9061728": 14, "90849805": 14, "910": 137, "91101986": 135, "91244936": [11, 12], "915": 156, "91g": 137, "9216": 14, "924": 156, "926": [128, 156], "928024": 6, "9296501": 14, "932": 156, "934": 156, "9375233e": 14, "9380709": 16, "941": 156, "9416149": 14, "9428282": 14, "9429494": 14, "95": [128, 163, 173, 174, 175, 178], "9503881": 14, "950912": 6, "952": 156, "9532328e": 14, "956": 156, "957": 156, "958": 156, "959": 156, "96": [14, 18, 128, 158], "9635296": 14, "96495728": 11, "965": 156, "96562607": 12, "96x96": [128, 158], "97562236": 13, "977": 156, "978": 156, "97854": 6, "979": 156, "9808417e": 16, "982": 156, "98219293": 12, "98270553": 11, "9841162": 131, "9886932": [11, 12], "9898634e": 14, "99": [14, 19, 177, 178], "9944268": 18, "997341": 131, "999": [134, 178], "99902063": 12, "9999": 129, "9\u03c0": 131, "A": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 14, 16, 17, 18, 19, 20, 127, 128, 131, 132, 134, 136, 137, 138, 139, 140, 141, 142, 144, 145, 146, 147, 148, 150, 151, 152, 153, 155, 156, 158, 159, 165, 166, 167, 174, 177, 178], "AND": 160, "And": [165, 169], "As": [2, 5, 10, 15, 17, 131, 132, 136, 149, 151, 152, 155, 156, 158, 159, 162, 167, 175, 177, 178], "At": [14, 17, 158], "Be": 156, "But": [137, 163], "By": [2, 4, 10, 17, 18, 131, 137, 138, 139, 140, 141, 146, 147, 148, 173], "For": [2, 3, 5, 7, 8, 9, 10, 17, 18, 19, 128, 129, 136, 151, 152, 153, 154, 155, 156, 158, 159, 160, 161, 162, 163, 165, 167, 169, 174, 178], "If": [1, 2, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 127, 128, 129, 132, 134, 137, 139, 140, 147, 148, 150, 151, 152, 153, 154, 155, 156, 157, 158, 160, 165, 167, 169, 171, 174, 175, 178], "In": [2, 7, 9, 13, 15, 16, 19, 128, 129, 130, 131, 132, 137, 138, 139, 140, 141, 145, 146, 147, 154, 155, 156, 158, 159, 161, 162, 165, 166, 167, 169, 173, 174, 175, 177, 178], "It": [2, 4, 6, 7, 9, 10, 11, 12, 16, 17, 127, 136, 137, 140, 141, 144, 145, 146, 148, 155, 156, 158, 159, 161, 162, 163, 165, 174, 177], "Its": 148, "No": [16, 17, 18, 150, 155, 159, 160, 177], "Not": [17, 155, 159], "OR": 160, "On": [131, 132, 133, 134, 135, 155, 156, 159, 175], "One": [7, 137, 140, 141, 156, 158, 159], "Or": [154, 160], "Such": [15, 167], "That": [3, 132, 158, 163], "The": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 126, 127, 128, 129, 130, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 150, 151, 152, 153, 154, 155, 156, 157, 158, 159, 161, 164, 165, 166, 168, 169, 170, 171, 172, 173, 174, 176, 177, 178], "Then": [1, 15, 159, 160, 165, 167], "There": [7, 15, 127, 129, 130, 133, 134, 136, 140, 142, 148, 151, 152, 154, 155, 156, 165], "These": [9, 126, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 155, 156, 160, 174, 177], "To": [1, 2, 4, 9, 10, 13, 15, 17, 18, 127, 128, 129, 131, 132, 144, 154, 155, 156, 158, 165, 167, 169, 174, 175, 177, 178], "WITH": 173, "Will": [9, 17, 20, 156], "With": [6, 14, 17, 148, 151, 152, 156, 163, 173, 174, 175, 178], "_": [9, 10, 11, 12, 13, 14, 16, 17, 18, 19, 128, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 156, 157, 160, 163, 167, 169, 175, 178], "_2": [137, 138, 139, 140, 141, 144, 145, 146, 147], "__all__": 156, "__class__": 178, "__del__": 156, "__eq__": 155, "__future__": [174, 177, 178], "__get_attr__": 156, "__getattr__": 156, "__getitem__": 155, "__init__": [2, 9, 14, 15, 16, 18, 156, 163, 165, 167, 174, 175, 177, 178], "__len__": 155, "__main__": 178, "__name__": 178, "__setitem__": 155, "_action": 141, "_action_to_direct": [159, 165], "_agent_loc": [159, 165], "_async_work": 11, "_bigint_from_byt": 155, "_build": 1, "_control": 141, "_cost": [140, 141], "_dtypedict": 5, "_episod": [14, 17], "_final_info": 14, "_final_observ": 14, "_get_info": [159, 165], "_get_ob": [159, 165], "_int_list_from_bigint": 155, "_k": 14, "_modul": 18, "_nois": [137, 138, 139, 140, 141, 142, 143, 146, 147], "_np_random": [2, 5, 10, 155], "_np_random_se": [2, 10], "_rang": [140, 141], "_render_fram": 165, "_replac": 175, "_reward_ctrl": 14, "_reward_run": 14, "_scale": [137, 138, 139, 140, 141, 142, 143, 146, 147], "_script": 1, "_static": [1, 173], "_step_mujoco_simul": 156, "_supportsdtyp": 5, "_target_loc": [159, 165], "_timelimit": 155, "_update_running_mean": [14, 19], "_worker": 11, "_x_posit": 14, "_x_veloc": 14, "a2c": [156, 170, 176], "a3c": 178, "a_": [166, 178], "a_0": 6, "a_i": 6, "a_max": 178, "a_min": 178, "a_n": 6, "a_t": 166, "aaronwalsman": 156, "ab": [128, 156, 178], "abbeel": [137, 178], "abdomen": [140, 141], "abdomen_i": [140, 141], "abdomen_x": [140, 141], "abdomen_z": [140, 141], "abil": [156, 158, 162], "abl": [156, 166], "abouelsaadat": 156, "about": [2, 3, 9, 127, 128, 129, 131, 132, 133, 134, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 150, 151, 152, 153, 154, 156, 158, 160, 161, 162, 165, 166, 174, 177], "abov": [2, 6, 7, 9, 131, 132, 135, 136, 156, 158, 161, 177, 178], "absolut": [141, 143, 147, 169], "abstract": [156, 165], "ac": [150, 163, 174], "academ": 162, "academia": 156, "acceler": [128, 133, 134, 135, 148, 155, 156, 178], "accent_r": 174, "accept": [2, 5, 7, 9, 17, 155, 156, 165, 169], "access": [14, 15, 17, 148, 155, 156, 158, 160, 161, 167], "accid": 155, "accident": [155, 156], "accord": [4, 5, 6, 7, 129, 169, 178], "accordingli": 165, "account": [148, 155, 156, 175], "accur": [136, 156, 163], "accuraci": 136, "achiev": [2, 131, 150, 155, 158, 162, 169, 173, 178], "acquir": 136, "acrobot": [130, 155], "acrobotenv": 131, "acronym": 177, "across": [13, 156, 173], "act": [14, 156, 158, 162, 163, 167, 174], "action": [2, 3, 4, 5, 6, 7, 9, 10, 11, 12, 15, 17, 20, 130, 136, 148, 149, 155, 156, 157, 160, 161, 165, 167, 169, 170, 175, 176, 177, 178], "action_log_prob": 178, "action_logit": 178, "action_logits_vec": 178, "action_mask": [154, 173], "action_masking_taxi": 173, "action_mean": 177, "action_pd": 178, "action_s": 175, "action_shap": 178, "action_spac": [2, 5, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 154, 156, 157, 158, 159, 160, 161, 163, 165, 167, 169, 173, 174, 175, 177], "action_space_dim": 177, "action_stddev": 177, "action_valu": 174, "actionwrapp": [14, 15, 16], "actor": 177, "actor_lay": 178, "actor_loss": 178, "actor_losses_moving_averag": 178, "actor_lr": 178, "actor_optim": 178, "actor_weight": 178, "actor_weights_path": 178, "acttyp": [2, 3, 9, 10, 11, 12, 14, 15, 16, 17, 18, 19, 156], "actual": [137, 154, 156, 158, 159, 161, 163, 165, 175, 178], "actuat": [131, 132, 140, 141, 156, 169], "acycl": 148, "ad": [14, 16, 17, 18, 19, 129, 132, 134, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 154, 155, 156, 158, 160, 165], "adamw": 177, "adapt": [132, 142, 143, 148, 151, 152, 161], "add": [1, 4, 5, 9, 11, 16, 17, 18, 19, 20, 128, 136, 137, 140, 141, 151, 152, 154, 155, 156, 158, 161, 163, 165, 167, 174, 178], "add_mark": 156, "add_subplot": 174, "addit": [2, 5, 129, 130, 148, 150, 154, 155, 156, 158, 159, 161, 163, 165, 169, 174, 177, 178], "addition": [148, 155, 156], "additional_wrapp": [4, 156], "addrenderobserv": [18, 20, 156], "address": 156, "addwhitenois": 156, "adilzouitin": 155, "adjac": 6, "adjust": [148, 169], "advanc": [11, 131, 148, 156, 161], "advantag": [137, 156, 165], "advis": 14, "affect": [6, 156, 159], "affin": [14, 16, 18, 20, 129], "after": [2, 3, 5, 9, 10, 17, 129, 137, 138, 139, 140, 141, 144, 145, 146, 147, 150, 154, 155, 156, 158, 160, 161, 163, 165, 166, 173, 174, 177, 178], "again": [2, 129, 154, 165], "against": [148, 155], "agent": [2, 4, 5, 14, 17, 20, 127, 128, 129, 133, 137, 138, 139, 140, 141, 142, 143, 145, 146, 147, 148, 155, 156, 159, 160, 162, 165, 166, 167, 173, 175], "agent_i": 159, "agent_posit": 167, "agent_x": 159, "agnost": [137, 138, 139, 140, 141, 146, 147], "ago": 156, "ahead": 155, "ahmedo42": 155, "ai": 148, "aim": [136, 139, 146, 147, 155, 156, 164, 168, 170, 172, 176, 177], "air": [144, 148, 156], "al": [4, 16, 17, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 155, 156, 160, 174], "ale_pi": [17, 156, 160], "alexdluken": 156, "algorithm": [2, 5, 10, 148, 149, 154, 155, 156, 158, 159, 160, 161, 163, 166, 169, 171, 174, 175, 177, 178], "alias": 148, "align": [154, 156, 160], "aliv": [140, 147], "alive_bonu": 142, "all": [2, 4, 5, 6, 7, 10, 11, 12, 13, 14, 15, 16, 17, 18, 126, 128, 129, 130, 131, 132, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 150, 151, 152, 153, 155, 156, 158, 159, 160, 167, 169, 170, 171, 173, 174, 175, 177, 178], "all_act": 175, "all_stat": 175, "alloc": 159, "allow": [3, 4, 5, 6, 9, 11, 12, 14, 15, 17, 18, 19, 20, 131, 132, 133, 134, 135, 140, 141, 142, 143, 147, 148, 155, 156, 158, 159, 160, 165, 167, 177, 178], "almost": 155, "along": [2, 9, 10, 15, 18, 128, 132, 133, 134, 142, 143, 146, 151, 152, 155, 156, 158], "alongsid": 158, "alpha": [161, 173], "alphabet": 7, "alphanumer": 7, "alreadi": [2, 10, 15, 156, 158], "alreadypendingcallerror": 11, "also": [2, 7, 9, 10, 11, 12, 17, 18, 127, 128, 129, 130, 136, 137, 143, 148, 155, 156, 158, 159, 160, 165, 166, 167, 169, 174, 175, 177, 178], "alter": [2, 15, 156, 158, 165], "altern": [1, 148, 156, 159], "although": [7, 137, 169], "altogeth": 169, "alwai": [7, 8, 17, 129, 133, 134, 137, 140, 141, 142, 145, 146, 150, 151, 152, 153, 156, 158, 163, 165], "amacati": 156, "ambigu": 160, "among": [16, 130, 136], "amount": [9, 127, 132, 142, 143, 177], "amp": 156, "amtamasi": 155, "an": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 129, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 150, 151, 152, 153, 154, 155, 156, 157, 158, 159, 160, 161, 162, 165, 166, 167, 169, 171, 173, 175, 178], "analog": 2, "analogi": 144, "analysi": [148, 161], "analyt": 142, "analyz": 161, "anderson": [132, 142, 143], "andrea": [156, 169, 175], "andrew": [133, 134, 156, 175], "andrewtanj": 155, "anerrupt": 156, "angl": [127, 129, 131, 132, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 155, 158, 159], "angle_1": 137, "angle_2": 137, "angle_3": 137, "angle_4": 137, "angular": [127, 129, 131, 132, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147], "ani": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 17, 18, 20, 129, 132, 137, 139, 140, 142, 143, 146, 147, 148, 153, 155, 156, 158, 159, 165, 166, 169, 174, 175, 177], "anim": [9, 136], "ankle_1": 137, "ankle_2": 137, "ankle_3": 137, "ankle_4": 137, "annot": [155, 156, 174, 175, 177, 178], "annot_kw": 175, "annoy": 156, "anoth": [14, 15, 17, 137, 140, 141, 143, 147, 154, 155, 163, 166, 174, 177], "ansi": [2, 155, 156, 165], "ansi_list": 2, "answer": [148, 163, 165], "ant": [136, 155, 156, 169], "anymor": [14, 18, 19, 155, 156], "anyth": [148, 169, 175], "anytrad": 148, "anywher": [156, 159], "apach": 148, "apart": 165, "api": [2, 3, 14, 17, 20, 148, 155, 156, 157, 158, 164, 165, 166, 168, 169, 170, 178], "apicompat": 156, "appear": [133, 134, 158], "append": [14, 19, 156, 163, 173, 174, 175, 177, 178], "appli": [2, 4, 8, 9, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 127, 129, 130, 131, 132, 133, 134, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 150, 155, 156, 160, 165, 167, 174, 177], "applic": [5, 7, 146, 148, 158, 159, 170, 172, 173, 176], "apply_along_axi": 174, "apply_api_compat": [4, 155, 156], "apply_env_compat": 156, "appreci": 155, "approach": [142, 155, 156, 160, 165, 173, 174, 177], "appropri": [156, 165, 169, 177], "approxim": [14, 19, 148, 163], "ar": [2, 4, 5, 6, 7, 8, 9, 10, 11, 13, 14, 15, 16, 17, 18, 19, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 126, 127, 128, 129, 130, 131, 132, 133, 134, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 149, 150, 151, 152, 153, 154, 155, 156, 158, 159, 160, 162, 163, 165, 166, 167, 169, 171, 173, 174, 177, 178], "araffin": 155, "arang": [174, 175, 178], "arbitrari": [2, 4, 7, 9, 148, 178], "arbitrarili": 156, "arcad": [17, 148], "archiv": 155, "archiveprefix": 156, "area": 136, "aren": 155, "arg": [9, 11, 12, 159, 163, 174, 177, 178], "argmax": [154, 163, 173, 174, 175], "argument": [4, 5, 6, 7, 8, 9, 10, 11, 12, 14, 16, 126, 130, 149, 155, 156, 158, 165, 169, 174], "ariel": 156, "arjun": [155, 156], "arm": [136, 140, 141, 144, 145, 148], "around": [3, 14, 126, 148, 155, 163], "arr": [163, 174], "arrai": [2, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 16, 17, 18, 20, 129, 131, 132, 133, 134, 135, 155, 156, 158, 159, 160, 163, 165, 167, 173, 174, 177, 178], "arrang": 4, "array_equ": [159, 165], "arrayconvers": [14, 17, 20, 156], "arraytyp": [10, 11, 12, 14], "arrow": [7, 175], "art": 163, "artemmiyi": 156, "articl": 175, "articul": [146, 148], "artifici": 154, "arxiv": [156, 178], "as_cmap": 175, "ascii": [155, 159], "ask": 159, "aspect": [155, 158, 166], "assert": [156, 165], "assess": 2, "asset": [153, 169], "assign": [2, 132, 133, 134, 144, 145, 148, 156, 174, 175], "assist": 148, "associ": [155, 156, 173], "assum": [7, 14, 18, 136, 156, 165], "assumpt": 160, "async": [4, 11, 156], "asynchron": [5, 10, 11, 12, 156], "asyncvectorenv": [10, 156, 162, 178], "atari": [9, 17, 20, 155, 156, 158, 174], "atari_wrapp": 18, "ataripreprocess": [17, 20, 156], "attach": [129, 132, 135, 137, 142, 143, 147], "attempt": [8, 129, 136, 154, 178], "attitud": 148, "attr": 6, "attribut": [4, 6, 11, 12, 17, 18, 19, 156, 158, 165, 167], "attributeerror": 156, "audio": 156, "augment": [18, 20, 158], "author": [133, 134, 155, 156, 169, 174, 175, 177, 178], "auto": [21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 156], "autobuild": 1, "autom": [148, 155], "automat": [1, 2, 4, 10, 11, 12, 14, 17, 18, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 155, 156, 163, 165, 178], "automata": [148, 156], "autoreset": [4, 10, 11, 12, 17, 20, 156], "autoreset_mod": [10, 11, 12, 156], "autoresetmod": [10, 11, 12, 156], "autoresetwrapp": [17, 155, 156], "autorom": [155, 156], "aux_1": 137, "aux_2": 137, "aux_3": 137, "aux_4": 137, "auxiliari": [2, 159, 165], "avail": [4, 10, 129, 148, 150, 151, 152, 155, 156, 159, 160, 161, 165, 169, 171, 173], "averag": [9, 14, 19, 20, 161, 163, 166, 174, 175, 177], "average_reward": 163, "avg_length": 161, "avg_rec": 161, "avg_reward": [161, 177], "aviat": 148, "avoid": [10, 13, 15, 151, 152, 154, 158, 159, 169, 173], "awai": [137, 138, 139, 140, 144, 145, 146, 147, 154, 167, 175], "awak": 129, "awar": [148, 156], "award": 132, "ax": [5, 7, 163, 165, 174, 175, 178], "ax1": 174, "ax2": 174, "axb2035": 156, "axi": [17, 18, 133, 134, 137, 140, 141, 146, 173, 174, 175], "ayesh": 156, "b": [1, 7, 144, 145, 154, 155], "b14c": 169, "b2dtut": 128, "b5": 7, "back": [11, 14, 15, 17, 18, 20, 126, 136, 137, 138, 156, 169], "back_leg": 137, "backend": [155, 156, 165], "background": 128, "backlog": 156, "backport": 155, "backward": [138, 155, 156, 177, 178], "bad": [13, 158, 159, 163], "badia": 178, "balanc": [132, 142, 143, 158, 159, 163, 173, 177, 178], "bali": 156, "balisujohn": [155, 156], "bandit": 148, "bar": [9, 163, 178], "bare": 15, "barto": [2, 131, 132, 142, 143, 150, 151, 152, 155, 174, 175], "base": [2, 4, 5, 9, 10, 13, 14, 15, 17, 18, 19, 20, 126, 131, 133, 134, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 154, 155, 156, 158, 159, 163, 165, 167, 169, 173, 174, 177, 178], "base_env": 15, "base_random_se": 173, "baselin": 148, "baselines3": [18, 171], "basemujocoenv": 156, "bash": 155, "basic": [156, 159, 160, 161, 163, 169, 171], "basicconfig": 161, "basilisk": 148, "batch": [5, 10, 11, 12, 13, 14, 155, 178], "batch_spac": [5, 13, 156], "bbox_inch": 173, "bbox_to_anchor": 174, "beanpow": 156, "beat": [148, 150], "beatabl": 174, "becam": 155, "becaus": [136, 160, 163, 165, 167, 169, 173, 174, 178], "becom": [126, 155, 156, 163, 166, 178], "been": [2, 9, 10, 15, 129, 137, 140, 141, 148, 155, 156, 158, 159, 165, 166, 175, 178], "befor": [2, 4, 9, 10, 14, 15, 16, 17, 18, 19, 20, 128, 137, 138, 139, 140, 144, 145, 146, 147, 155, 156, 158, 160, 163, 165, 167, 169, 177, 178], "began": 156, "begin": [14, 17, 155, 158, 159, 160, 165, 174, 178], "beginn": [156, 159], "behav": [155, 161], "behavior": [14, 15, 135, 136, 137, 138, 139, 140, 141, 146, 147, 148, 155, 156, 158, 159, 160, 161, 163, 165, 167, 169], "behaviour": [129, 136, 156], "behind": [2, 137, 140, 156, 160], "being": [3, 4, 6, 7, 8, 17, 129, 133, 134, 135, 137, 140, 141, 144, 145, 155, 156, 158, 159, 163, 169, 174, 175], "believ": 156, "bellman": 163, "belong": 6, "below": [7, 10, 20, 135, 147, 156, 158, 160, 166, 174, 178], "benchmark": [126, 148], "benchmark_init": 9, "benchmark_rend": 9, "benchmark_step": 9, "benefit": [17, 156, 173], "bennet": 148, "besid": 136, "best": [163, 173, 174, 175, 178], "better": [127, 155, 156, 159, 160, 163, 173, 178], "between": [3, 6, 7, 14, 17, 18, 19, 20, 129, 131, 132, 135, 136, 137, 138, 139, 140, 141, 142, 143, 145, 146, 147, 148, 155, 156, 158, 159, 160, 163, 165, 166, 174, 175, 177, 178], "beyond": 156, "bf1797a3": 169, "bfoot": 138, "bia": [137, 138, 139, 140, 141, 146, 147, 178], "bias": [161, 178], "big": [163, 165, 175], "bigger": 175, "biggest": [160, 175], "bike": [158, 163], "binari": [5, 7, 148, 158, 165, 173], "bind": [126, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 155], "biomechan": 136, "bipe": 136, "biped": [126, 140, 141, 147, 155, 169], "bipedal_walk": 127, "bipedalwalk": [127, 155], "biplan": 148, "bird": 148, "bit": 155, "bitcraz": 148, "bkrl": 155, "black": [131, 155, 156, 174, 175], "blackjack": [149, 155, 156, 170, 176], "blackjack_q_learn": 174, "blackjackag": [163, 174], "blit": 165, "blob": [151, 152, 155, 169], "block": 156, "blog": [155, 156, 160], "blue": [131, 154, 165, 173, 175], "blueski": 148, "board": 148, "board_gam": 155, "bodi": [129, 136, 137, 138, 139, 140, 141, 142, 144, 146, 147, 169], "boilerpl": [15, 158, 165, 167], "bonu": [147, 178], "book": [131, 150, 151, 152, 155, 174], "book_or_nip": 131, "bool": [2, 4, 5, 6, 7, 9, 10, 11, 12, 14, 15, 17, 18, 132, 136, 137, 138, 139, 140, 141, 146, 147, 163, 165, 173, 174, 175, 177], "bool8": 156, "bool_": 156, "boolean": [2, 5, 9, 14, 17, 129, 156, 174, 177], "booster": 129, "bootstrap": [2, 160, 166, 173, 178], "bot": 148, "both": [7, 10, 11, 12, 18, 127, 130, 131, 147, 148, 150, 151, 152, 153, 154, 155, 156, 158, 159, 160, 161, 162, 165, 166, 173, 175, 177], "bother": 165, "bottom": [128, 133, 134, 139, 151, 152, 156, 159, 175], "bound": [2, 7, 14, 16, 17, 18, 19, 20, 129, 131, 132, 133, 134, 135, 155, 156, 158, 159, 166], "boundari": 8, "bounded": 5, "box": [2, 5, 6, 7, 8, 10, 11, 13, 14, 15, 16, 17, 18, 20, 127, 128, 129, 131, 132, 133, 134, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 155, 156, 158, 159, 165, 167], "box2d": [127, 128, 129, 155, 156, 158], "brake": 128, "brax": [148, 156], "break": [155, 156, 160, 163, 175], "bridg": 148, "bring": 156, "britojr": 156, "brittl": 177, "broken": [17, 155], "brown": 156, "browser": 1, "bshin": 138, "bsk": 148, "bsuit": 148, "bthigh": 138, "btjanaka": 156, "buffalo": 148, "buffer": [14, 17, 128], "buffer_length": [14, 17, 161, 163, 174, 178], "bug": [17, 129, 136, 137, 139, 140, 142, 143, 144, 145, 147, 153, 155, 156, 160, 163], "build": [5, 126, 137, 138, 139, 140, 141, 142, 143, 146, 147, 148, 156, 158, 161, 165, 167], "built": [13, 148, 155, 156, 159, 162], "bullet": 148, "bump": 155, "bunch": 175, "burden": 177, "bushi": 9, "busi": 158, "bust": [150, 163, 174], "button": [5, 7, 9, 158], "c": [9, 129, 131, 156, 165, 177], "cab": 154, "calcul": [14, 18, 19, 135, 137, 142, 151, 152, 153, 154, 159, 161, 169, 173, 178], "call": [2, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 137, 144, 145, 150, 153, 155, 156, 158, 159, 160, 163, 165, 169, 174, 178], "call_async": 156, "call_wait": 156, "callabl": [3, 4, 9, 11, 12, 13, 14, 16, 17, 18, 19, 156], "callback": [9, 155], "cambridg": [133, 134], "camera": [136, 137, 138, 139, 140, 146, 147], "camera_id": 136, "camera_nam": 136, "campbel": 128, "can": [1, 2, 4, 5, 6, 7, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 126, 128, 129, 130, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 150, 151, 152, 153, 154, 155, 156, 157, 158, 159, 160, 161, 162, 163, 165, 167, 169, 173, 175, 177, 178], "cannot": [4, 8, 13, 17, 148, 151, 152, 155, 156, 165, 166, 171], "canva": 165, "capabl": [155, 157, 161], "capped_cubic_video_schedul": [9, 17], "captur": [9, 17], "car": [126, 130, 148, 155, 158], "car_rac": [128, 155, 158], "card": [150, 163, 174], "cardin": 159, "care": [5, 148, 163], "carl": 148, "carlo": [163, 174, 177, 178], "carloslui": 155, "carrac": [9, 14, 18, 128, 155, 156, 158], "cart": [130, 142, 143, 158, 177], "cart_posit": 158, "cart_veloc": 158, "cartesian": [6, 7, 135], "cartpol": [2, 9, 10, 14, 16, 17, 18, 19, 130, 132, 136, 142, 143, 148, 155, 156, 158, 160, 161, 163, 171, 177], "cartpoleenv": [17, 132, 156], "cartpolejax": 17, "cartpolevectorenv": [132, 156], "casadi": 148, "case": [2, 3, 5, 6, 7, 13, 14, 16, 128, 137, 138, 139, 140, 141, 146, 147, 154, 156, 158, 159, 160, 165, 166, 167, 169, 177, 178], "casino": [163, 174], "cast": 18, "cat": 138, "catch": [156, 159, 161], "categor": [7, 178], "categori": 1, "caught": 155, "caus": [140, 147, 154, 155, 156, 162, 163], "cbar": 174, "cc": 131, "cclauss": 155, "ccmdp": 148, "cd": 1, "cell": [148, 151, 152, 159, 165], "cellular": [148, 156], "center": [14, 18, 20, 128, 129, 132, 135, 137, 140, 141], "centr": [137, 140, 141], "central": 156, "centric": 177, "certain": [2, 143, 145, 155, 156, 174, 178], "cfrc_ext": [137, 140, 141], "chain": [15, 131, 146, 158], "challeng": [148, 163, 174], "chanc": [11, 148, 154], "chandrasekar": 177, "chang": [1, 2, 3, 9, 11, 12, 13, 14, 15, 16, 17, 18, 19, 128, 129, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 143, 146, 147, 148, 154, 155, 156, 158, 159, 162, 165, 167, 169, 174, 177], "changelog": [4, 155, 156], "channel": [14, 17, 18], "charact": [7, 9], "character": 148, "charg": [6, 148], "charlist": 7, "charraut": 156, "charset": 7, "cheat": 163, "check": [1, 2, 5, 7, 15, 17, 20, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 154, 155, 156, 158, 160, 163, 165, 167, 169, 174, 175], "check_env": [9, 156, 159, 160], "check_environments_match": 156, "checker": [4, 20, 155, 156], "cheetah": 136, "chess": 158, "child": 13, "children": 11, "choic": [158, 159, 173, 175, 177, 178], "choos": [158, 163, 165, 169, 173, 175], "choose_act": 175, "chosen": [2, 7, 151, 152, 175, 178], "chri": 128, "christofkaufmann": 156, "chrisyeh96": 156, "chunk": 17, "ci": [9, 155, 156], "cinert": [140, 141], "circl": 165, "citat": 156, "cite": 156, "civil": 148, "clamp": [140, 141], "clarifi": [155, 156], "clariti": 159, "class": [2, 3, 4, 5, 6, 7, 9, 10, 11, 12, 14, 15, 17, 18, 19, 136, 148, 155, 156, 158, 159, 162, 163, 165, 167, 169, 174, 175, 177, 178], "classic": [129, 131, 132, 133, 134, 135, 139, 143, 146, 147, 148, 155, 156, 158, 166, 173], "classic_control": [17, 155], "classif": 148, "classmethod": 15, "clean": [2, 148], "cleaner": [154, 160], "cleanup": 155, "clear": [13, 17, 156, 158, 159, 160, 161, 163], "clear_mpi_env_var": 13, "clearer": [2, 155, 161], "clearli": 5, "clementperroud": 156, "cliff": [149, 156], "cliff_walk": [151, 152], "cliffwalk": [151, 152, 155, 156], "cliffwalkingslipperi": 152, "climb": 130, "clip": [14, 16, 19, 20, 133, 134, 137, 156, 158, 159, 165, 167, 178], "clip_reward": 165, "clipact": [14, 16, 20, 158], "clipreward": [10, 14, 19, 20, 156, 167], "clobber": 155, "clock": [161, 165], "clockwis": 135, "clone": [148, 169], "close": [2, 3, 7, 9, 10, 11, 12, 14, 15, 17, 19, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 136, 137, 139, 140, 145, 147, 155, 156, 157, 158, 160, 161, 167, 169, 173, 174, 175, 178], "close_extra": [10, 11, 12], "closechoic": 156, "closer": [129, 150, 156, 163], "closest": 127, "cloudpickl": 13, "cloudpicklewrapp": 13, "cluster": 148, "cmap": [174, 175], "cnt": 156, "co": [131, 133, 134, 135, 142, 145, 148], "coars": 131, "code": [2, 3, 5, 6, 9, 11, 14, 15, 17, 18, 19, 131, 148, 155, 156, 161, 162, 165, 167, 169, 170, 173, 174, 175, 177, 178], "codebas": [156, 160, 165], "coeffici": [146, 178], "coin": 7, "coincid": 165, "col": [151, 152, 153], "cola": 156, "colder": 155, "collabor": 161, "collect": [2, 10, 11, 12, 17, 20, 148, 156, 157, 161, 163, 169, 174, 178], "collector": 156, "collid": 129, "collis": [133, 134, 148, 155], "color": [2, 6, 154, 173], "color_palett": 175, "colour": [128, 155], "column": [4, 163, 175, 177], "com": [19, 140, 141, 151, 152, 153, 155, 165, 169, 171, 175, 177], "combin": [2, 5, 9, 15, 145, 158, 159, 178], "come": [129, 137, 138, 139, 140, 146, 147, 156], "comet": 156, "command": [136, 165], "comment": [136, 155, 156, 178], "commit": [156, 165], "common": [7, 15, 18, 20, 156, 160, 161, 166, 167, 170, 172, 176, 177], "commonli": [20, 155], "commonroad": 148, "commun": [11, 155, 160, 161], "compar": [139, 140, 146, 147, 148, 160, 161, 173, 174, 175, 178], "comparison": [161, 173], "compartment": 156, "compat": [14, 17, 18, 20, 144, 148, 155, 156, 165, 166, 167, 169, 173, 174, 175, 177, 178], "compet": 161, "compil": [148, 155, 162], "compilergym": 148, "complement": 2, "complet": [1, 4, 11, 17, 128, 129, 156, 158, 159, 161, 163, 166, 167, 174], "complex": [5, 6, 136, 140, 141, 142, 143, 148, 156, 158, 160, 161, 162, 177, 178], "compli": 155, "complianc": 155, "compliant": 155, "complic": [7, 15, 160, 167], "compon": [18, 158, 159, 160, 165], "compos": [9, 137, 138, 139, 140, 141, 143, 146, 147], "composit": 7, "compound": 8, "comprehens": [148, 155], "compris": 7, "comput": [2, 3, 9, 14, 18, 19, 20, 136, 137, 155, 156, 159, 161, 163, 165, 173, 174, 177, 178], "computation": [148, 162], "compute_metr": 9, "concat": 175, "concaten": [5, 8, 11, 12, 13, 136, 156], "conceptu": [7, 160, 163], "concern": 177, "conda": [156, 165], "condit": [2, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 166, 169, 174, 177], "conduct": 156, "confid": 161, "config": 4, "configur": [126, 130, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 149, 159, 160, 161, 165, 174, 178], "confirm": [131, 155], "conflict": 9, "congratul": [159, 163], "conjunct": [9, 13], "connect": [2, 6, 11, 131, 137, 138, 139, 140, 141, 145, 146, 147, 148], "connectionist": 177, "consecut": 129, "consequ": [155, 158, 163], "consid": [4, 128, 129, 130, 136, 137, 139, 140, 143, 147, 165, 167, 173], "consist": [3, 7, 127, 129, 131, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 150, 155, 156, 158, 159, 160, 161, 162, 163, 165, 167, 169, 173, 174, 177], "consol": [4, 161], "consolid": 155, "constant": [3, 129, 134, 137, 140, 141, 142, 163], "constantli": 145, "constitu": 6, "constrain": [148, 173], "constraint": [140, 141, 142, 148, 159, 160], "construct": [7, 9, 131, 137, 138, 139, 140, 141, 146, 147, 148], "constructor": [4, 9, 15, 155, 156, 158, 165], "consult": 169, "consumpt": 2, "contact": [127, 129, 136, 137, 140, 141, 142, 155], "contact_cost": [137, 140], "contact_cost_rang": 140, "contact_cost_weight": [137, 140, 169], "contact_force_rang": 137, "contain": [1, 2, 5, 8, 10, 13, 17, 18, 127, 128, 129, 131, 132, 133, 134, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 150, 151, 152, 153, 154, 155, 156, 158, 159, 165, 169, 171, 174, 177, 178], "content": 161, "context": [4, 11, 13, 148, 177], "contextu": 148, "continu": [2, 5, 9, 14, 18, 19, 128, 129, 130, 133, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 155, 158, 159, 166, 174, 177, 178], "continuous_mountaincarenv": 134, "contribut": [126, 148, 156, 171], "contributor": 156, "control": [2, 5, 7, 126, 128, 131, 132, 133, 134, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 155, 156, 158, 159, 163, 167, 169, 175, 178], "conveni": [6, 15, 158, 159, 165], "convent": [1, 2], "converg": [163, 173, 174, 175], "convers": [3, 148, 156], "convert": [1, 5, 6, 14, 17, 18, 20, 129, 148, 155, 156, 159, 160, 174, 175], "convert_to_done_step_api": [9, 160], "convert_to_terminated_truncated_step_api": [9, 160], "convolution_mod": 163, "convolv": [156, 163, 174, 178], "cool": 156, "coordin": [7, 14, 127, 129, 135, 137, 138, 139, 140, 141, 144, 145, 146, 147, 148, 159], "coordinatesof": 142, "copi": [10, 11, 12, 13, 159, 165], "copier": 165, "core": [155, 156, 158, 159, 163], "correct": [4, 9, 10, 16, 129, 148, 154, 155, 156, 158, 160, 163, 165, 166, 177], "correctli": [2, 9, 14, 18, 19, 155, 156, 165, 166], "correspond": [1, 2, 4, 7, 11, 12, 15, 18, 129, 131, 132, 133, 134, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 150, 154, 165, 175, 177, 178], "correspondingli": 128, "cosin": [131, 142, 145], "cost": [127, 156], "could": [2, 9, 14, 137, 138, 139, 140, 141, 143, 146, 147, 156, 158, 159, 160, 163, 165, 166, 167, 169, 173, 174, 175, 177, 178], "couldn": 160, "coulom": 146, "count": [7, 127, 129, 150, 163, 174], "counter": [135, 156], "coupl": 178, "cours": [148, 175], "cover": [5, 12, 174], "coverag": 148, "cpu": [129, 136, 162, 178], "craft": 129, "craftium": 148, "crash": [129, 158], "crazyfli": 148, "creat": [4, 5, 7, 9, 10, 11, 12, 13, 14, 15, 17, 127, 128, 129, 145, 148, 155, 156, 158, 160, 161, 162, 163, 167, 169, 173, 174, 177, 178], "create_empty_arrai": [5, 13, 156], "create_grid": 174, "create_plot": 174, "create_se": 155, "create_shared_memori": [5, 13], "creation": [2, 4, 156, 160, 165], "creatur": 148, "criteria": [158, 159], "critic": [2, 17, 156], "critic_lay": 178, "critic_loss": 178, "critic_losses_moving_averag": 178, "critic_lr": 178, "critic_optim": 178, "critic_weight": 178, "critic_weights_path": 178, "cross": [151, 152, 153], "crucial": [5, 10, 158, 159, 160], "crypto": 148, "cstride": 174, "ctr_cost": 147, "ctrl_cost": [137, 138, 139, 140, 146, 147], "ctrl_cost_weight": [137, 138, 139, 140, 141, 146, 147, 169], "ctx": 13, "cube": 5, "cuda": [148, 178], "cum_reward": 175, "cumsum": 175, "cumul": [9, 14, 17, 20, 175], "cumulative_reward": 9, "cupi": [14, 17], "current": [2, 4, 7, 9, 10, 17, 18, 128, 148, 150, 151, 152, 153, 154, 155, 156, 158, 159, 162, 163, 165, 173, 174, 175, 177, 178], "current_col": [151, 152, 153], "current_namespac": 4, "current_q": 163, "current_row": [151, 152, 153], "curriculum": 155, "curv": [155, 161, 173], "custom": [2, 5, 10, 11, 12, 14, 15, 17, 18, 132, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 153, 155, 156, 158, 161, 163, 168, 170], "customis": 148, "customiz": 148, "customspaceerror": 13, "cut": [160, 163], "cvel": [140, 141], "cyaneu": 153, "cylind": 144, "cython": 156, "d": [7, 9, 15, 131, 148, 159, 171, 178], "dac": 148, "dacbench": [148, 156], "daemon": 11, "dag": 148, "dai": 126, "danger": 173, "darkgrid": 177, "data": [5, 8, 9, 10, 15, 148, 155, 156, 158, 159, 161, 162, 163, 165, 167, 174, 175, 177, 178], "data_equival": 156, "data_equivil": 156, "databas": 2, "datafram": [175, 177], "datapoint": 8, "dataset": 156, "datatyp": 155, "david": 175, "davidpl1": 156, "davidslayback": 156, "de": 156, "dead": [155, 156], "deal": [6, 178], "dealer": [150, 155, 163, 174], "dealer_card": 163, "dealer_count": 174, "debug": [2, 5, 9, 148, 149, 155, 156, 158, 160, 161, 163], "decai": [163, 174], "decay_epsilon": [163, 174], "decent": [174, 177], "decid": [150, 156, 175], "decis": [148, 155, 156, 158, 159, 163, 166], "deck": [150, 163, 174], "declar": 159, "decomposit": 154, "decreas": [129, 162, 163, 175], "deep": [148, 155, 162, 166, 171, 175, 177, 178], "deepmind": [136, 155, 169], "def": [9, 14, 156, 159, 163, 165, 167, 169, 173, 174, 175, 177, 178], "default": [2, 4, 5, 6, 7, 9, 10, 11, 12, 13, 14, 15, 17, 18, 19, 128, 129, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 151, 152, 155, 156, 158, 159, 165, 166, 169], "default_camera_config": [136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147], "default_rng": 175, "defaultdict": [163, 174], "defin": [2, 3, 5, 8, 11, 12, 14, 15, 16, 17, 18, 135, 155, 156, 158, 159, 165, 166, 167, 175, 178], "definit": [137, 139, 140, 142, 155, 156, 166], "deform": 148, "deformable_gym": 148, "degre": [11, 140, 141, 142, 167, 178], "delai": [18, 20, 156, 165], "delayobserv": [18, 20, 156], "deleu": 156, "deliv": 154, "delta": [175, 177], "demand": 128, "demo": 1, "demonstr": [14, 127, 148, 161, 169, 173, 178], "dennybritz": [151, 152], "denot": [2, 132, 153], "densiti": [144, 148, 156], "depend": [2, 6, 9, 10, 14, 18, 19, 126, 129, 130, 132, 136, 137, 138, 139, 140, 141, 146, 147, 153, 155, 156, 165, 175, 178], "dependencynotinstal": [9, 17], "deprec": [2, 136, 155, 156], "depreci": 155, "depth": 156, "depth_arrai": 136, "deque_s": [14, 17], "deriv": [137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 177], "derk": 148, "desc": [153, 175], "describ": [2, 5, 6, 7, 131, 132, 146, 150, 155, 156, 158, 167], "descript": [6, 20, 136, 156, 165], "design": [131, 140, 141, 148, 149, 154, 156, 163], "desir": [9, 14, 154, 159, 169, 178], "despit": 156, "destin": [154, 173], "destroi": [129, 156], "detach": 178, "detail": [5, 6, 7, 9, 19, 131, 148, 155, 156, 158, 159, 161, 163, 165, 169, 173, 178], "detect": [156, 160, 165], "determin": [2, 17, 129, 131, 132, 133, 134, 135, 153, 155, 156, 158, 159, 165, 166, 169], "determinist": [16, 129, 131, 133, 134, 165, 178], "dev": [2, 155, 177], "develop": [136, 148, 155, 156, 160, 161, 163, 171, 177], "deviat": [146, 163, 177, 178], "devic": [14, 17, 156, 178], "devicearrai": 17, "dexter": 148, "dexteroushand": 148, "df1": 177, "di": 160, "diagnost": 2, "diagon": 159, "diagram": 135, "dict": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 18, 20, 136, 151, 152, 153, 154, 155, 156, 158, 159, 160, 165, 173, 177], "dict_info": 14, "dict_kei": 18, "dict_time_kei": 18, "dictat": [128, 129], "dictinfotolist": [10, 14, 20, 156], "dictionari": [2, 5, 6, 7, 9, 10, 14, 18, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 155, 156, 158, 159, 165, 167, 173, 174, 177], "did": [156, 166], "didn": [156, 175], "die": 128, "dietterich": 154, "differ": [2, 5, 6, 9, 11, 12, 16, 17, 18, 128, 135, 136, 147, 148, 155, 156, 158, 159, 160, 161, 163, 165, 166, 167, 169, 170, 172, 173, 175, 176, 178], "differenti": 166, "difficult": [132, 136, 142, 143, 156, 159, 160, 162, 163, 175], "difficulti": [155, 159], "digit": 7, "dim": [140, 141], "dimens": [5, 7, 8, 18, 148, 156, 177], "dimension": [5, 17, 129, 137, 138, 139, 146, 147, 156, 158, 159, 165, 178], "direct": [6, 131, 132, 133, 134, 137, 138, 139, 140, 142, 143, 146, 147, 148, 151, 152, 153, 154, 159, 163, 165, 175, 177], "directli": [2, 6, 10, 15, 17, 131, 136, 158, 159, 165, 174, 177], "directori": [1, 155, 165], "dirhtml": 1, "disabl": [4, 17, 18, 19, 151, 152, 153, 155, 156, 163, 169], "disable_env_check": [4, 16, 17, 155], "disable_logg": 17, "disable_print": 4, "disable_render_order_enforc": [17, 155], "disallow": 154, "disc_to_cont": 167, "discard": 18, "discord": [148, 155, 156, 160, 171], "discount": [14, 19, 160, 163, 166, 174, 175, 177, 178], "discount_factor": [163, 173, 174], "discourag": 155, "discov": [156, 169], "discret": [2, 5, 6, 7, 8, 11, 13, 18, 128, 129, 131, 132, 133, 134, 148, 149, 150, 151, 152, 153, 154, 155, 156, 158, 159, 163, 165, 167, 174], "discrete_act": 165, "discreteact": 167, "discreteenv": 155, "discuss": [155, 156, 159], "displac": [137, 138, 139, 140, 146, 147], "displai": [2, 4, 132, 155, 160, 165], "dissect": 175, "dist": 144, "distanc": [138, 139, 141, 144, 147, 159, 165], "distance_from_origin": [137, 140], "distance_penalti": 142, "distinct": [160, 166], "distinguish": [2, 159, 160, 165, 166], "distrib": 177, "distribut": [5, 6, 7, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 153, 155, 156, 169, 175, 177, 178], "dive": 158, "divers": [148, 157], "dlpack": 156, "do": [4, 7, 13, 15, 17, 128, 129, 131, 155, 156, 158, 159, 161, 163, 165, 167, 169, 175, 177, 178], "doc": [9, 129, 155, 156, 167], "dockerfil": 155, "docstr": [1, 155, 156], "doctest": 156, "document": [5, 7, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 126, 130, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 149, 155, 156, 158, 160, 165, 169, 174, 178], "doe": [2, 6, 8, 9, 10, 11, 12, 13, 15, 17, 18, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 150, 155, 156, 159, 165, 166, 167, 178], "doesn": [1, 2, 4, 15, 17, 129, 155, 156, 159, 166, 175], "dof": [137, 140, 141], "dog": 9, "doi": [154, 156], "domain": [16, 128, 131, 133, 134, 154, 167], "domain_random": 128, "don": [6, 14, 15, 128, 133, 155, 156, 158, 159, 160, 165, 166, 173, 175, 178], "done": [2, 9, 14, 155, 156, 158, 163, 165, 166, 169, 173, 174, 175, 177, 178], "doom": 148, "dot": [6, 7, 165], "doubl": 136, "doublependulum": 142, "down": [5, 7, 128, 141, 148, 150, 151, 152, 153, 154, 156, 159, 163, 165, 166, 173, 174, 175], "download": [165, 166, 167, 170, 173, 174, 175, 177, 178], "downward": 131, "dpi": 173, "dramat": [155, 156], "draw": [6, 150, 163, 165, 174], "drawn": [6, 7, 144, 146, 150, 163], "drive": [128, 173], "driver": 156, "drone": 148, "drop": [154, 156, 173], "drryanhuang": 156, "dry": 159, "dsctt": 155, "dstack": 174, "dt": [137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 156, 169], "dtype": [2, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 16, 17, 18, 20, 129, 131, 132, 133, 134, 135, 155, 156, 159, 165, 175], "dtypeobserv": [14, 18, 20, 156], "dual": 148, "duburcqa": [155, 156], "duckietown": 148, "due": [2, 129, 132, 136, 153, 155, 156, 158, 160, 163, 166, 178], "dump": 156, "dunbar": 156, "dunder": 156, "duplic": [14, 156], "durat": [9, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 155, 161, 177], "dure": [2, 4, 6, 7, 10, 14, 17, 18, 19, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 154, 155, 156, 160, 165, 167, 169, 173], "dw": 9, "dx": [137, 138, 139, 140, 146, 147], "dylwil3": 156, "dynam": [2, 16, 131, 135, 136, 142, 148, 155, 156, 159, 160], "e": [1, 2, 4, 5, 7, 8, 9, 11, 13, 14, 15, 17, 20, 129, 137, 138, 139, 140, 141, 143, 144, 145, 146, 147, 148, 150, 153, 155, 156, 159, 165, 167, 174, 175, 177, 178], "e3c16072f695": 169, "each": [2, 5, 6, 7, 9, 10, 11, 12, 13, 14, 16, 17, 18, 20, 126, 127, 128, 129, 130, 131, 132, 133, 134, 136, 137, 140, 141, 142, 143, 144, 145, 148, 149, 151, 152, 154, 155, 156, 158, 159, 160, 161, 163, 165, 173, 174, 175, 178], "earli": [126, 161, 163, 174, 177], "earlier": [137, 140, 141, 165], "earliest": 177, "easi": [148, 149, 155, 158, 159, 175], "easier": [130, 155, 156, 158, 159, 178], "easiest": [128, 155, 156], "easili": [6, 10, 15, 148, 155, 156, 162], "east": [154, 173], "ed": 131, "edg": [5, 6, 8, 132, 155, 156, 158, 159, 163], "edge_link": [6, 8], "edge_mask": 6, "edge_spac": [6, 8], "edgecolor": 174, "edit": [148, 155, 165], "educ": 161, "effect": [2, 8, 13, 15, 17, 129, 137, 141, 142, 143, 144, 145, 146, 154, 158, 159, 161, 173, 174, 177], "effector": [144, 145], "effici": [11, 133, 134, 136, 148, 156, 159, 161, 162, 173, 178], "effort": [130, 156], "eg": 165, "egl": 136, "eight": 137, "einforc": 177, "either": [7, 8, 9, 12, 14, 16, 17, 133, 134, 148, 150, 153, 154, 156, 158, 160, 175, 177, 178], "ekalosak": [155, 156], "elaps": [14, 17], "elbow": 144, "electron": 148, "element": [2, 5, 6, 7, 10, 11, 13, 18, 132, 133, 134, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 156, 158, 165, 169, 177, 178], "elev": 169, "eleven": 136, "elf": 153, "elif": [159, 160], "elimin": 173, "elliottow": 156, "elo": 148, "els": [14, 18, 139, 147, 153, 154, 156, 159, 163, 165, 173, 174, 175, 178], "emb": 169, "embed": [161, 169], "emerg": [156, 161], "emit": 2, "emphas": 159, "emploi": 17, "empti": [5, 7, 13, 17, 137, 138, 139, 140, 141, 146, 147, 156, 159, 174, 175, 177], "emul": [155, 160], "en": [18, 177], "enabl": [4, 9, 17, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 128, 148, 155, 156, 160], "enable_wind": [129, 178], "encapsul": 2, "encod": [8, 148, 154, 155, 165], "encompass": 148, "encount": [160, 163, 178], "encourag": [155, 159, 169, 178], "end": [2, 3, 10, 14, 17, 127, 135, 136, 155, 156, 157, 158, 159, 160, 161, 163, 166, 169, 174, 175, 177, 178], "endeavor": 148, "energi": [127, 129, 132, 159, 167], "enforc": [4, 17, 155], "engin": [129, 136, 148, 156], "english": 7, "enough": [159, 169, 178], "ensur": [1, 2, 4, 6, 8, 9, 129, 148, 156, 158, 159, 161, 163, 165, 173, 174], "ent_coef": 178, "enter": [2, 9, 129, 151, 152], "entir": [9, 17, 139, 147, 155, 156, 178], "entiti": 5, "entrain": 148, "entri": [4, 155, 156, 159, 163], "entropi": [2, 178], "entropy_moving_averag": 178, "entry_point": [4, 155, 159, 165], "entrypoint": 165, "enum": [4, 10, 156, 165], "enumer": [173, 175], "env": [4, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 127, 128, 129, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 151, 152, 153, 154, 155, 156, 157, 158, 159, 160, 161, 163, 166, 167, 169, 170, 173, 174, 175, 176, 177], "env_check": [9, 155, 156, 159], "env_devic": [14, 17], "env_fn": [11, 12], "env_id": [4, 156, 160], "env_lambda": 9, "env_mask": 173, "env_nam": [4, 161], "env_new": 9, "env_old": 9, "env_spec": 156, "env_spec_kwarg": 156, "env_typ": 1, "env_unmask": 173, "env_xp": [14, 17], "envapicompat": 155, "envcompat": 155, "envcreat": 4, "environ": [4, 5, 7, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 126, 127, 128, 129, 130, 131, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 149, 150, 151, 152, 153, 154, 155, 156, 157, 161, 166, 167, 168, 170, 171, 172, 176, 177], "environment_cr": 165, "environmentnam": 156, "envpool": [155, 156], "envs_wrapp": 178, "envspec": [2, 3, 4, 10, 15, 17, 156], "ep": [175, 177], "ep_action_log_prob": 178, "ep_reward": 178, "ep_value_pr": 178, "episod": [2, 4, 9, 10, 14, 17, 18, 20, 155, 156, 157, 158, 159, 160, 163, 165, 166, 169, 173, 174, 175, 177, 178], "episode_data": 161, "episode_id": 9, "episode_index": 9, "episode_num": 161, "episode_ov": [158, 161], "episode_returns_moving_averag": 178, "episode_reward": [14, 19, 161, 163, 173], "episode_tim": 161, "episode_trigg": [9, 17, 161], "episodestatisticsrecord": 156, "epoch": 178, "eprint": 156, "epsilon": [14, 18, 19, 163, 173, 174, 175], "epsilon_decai": [163, 174], "epsilongreedi": 175, "equal": [11, 12, 129, 133, 134, 139, 144, 147, 150, 153, 154, 163, 175], "equat": [131, 135, 163], "equival": [4, 5, 8, 10, 14, 137, 140, 155, 156, 178], "erez": [139, 140, 141], "ericonaldo": 155, "error": [2, 4, 7, 8, 9, 11, 17, 20, 155, 156, 158, 163, 166, 174, 178], "errorr": 155, "escap": 2, "especi": [5, 160, 165, 167, 178], "essenti": [7, 161, 169], "estim": [19, 137, 160, 163, 166, 177, 178], "estimate_valu": 160, "et": [16, 17], "etc": [2, 5, 10, 14, 17, 137, 138, 139, 140, 146, 147, 155, 156, 158, 159, 160, 161, 165, 166, 167], "euclidean": [144, 145], "ev": 148, "ev2gym": 148, "eval": [161, 178], "eval_env": 160, "evalu": [14, 17, 18, 19, 148, 156, 160, 169, 174], "evanmath": 155, "even": [2, 4, 137, 139, 140, 142, 143, 147, 155, 159, 163, 165, 174], "event": [9, 155, 165], "eventu": [13, 158], "ever": [126, 155], "everi": [1, 5, 6, 9, 14, 17, 18, 19, 128, 129, 132, 137, 139, 140, 142, 143, 147, 156, 158, 159, 160, 165, 173, 177, 178], "everyon": 136, "everyth": [17, 148, 158, 159], "evolv": 9, "exact": [150, 156, 174], "exactli": [8, 146, 158, 159, 161], "exampl": [1, 2, 6, 7, 8, 9, 10, 11, 12, 13, 14, 16, 17, 18, 19, 128, 131, 136, 148, 150, 151, 152, 153, 155, 156, 158, 161, 163, 165, 166, 167, 169, 170, 172, 173, 174, 176, 178], "examplefuncenv": 156, "exce": [127, 150], "exceed": [2, 17, 20, 158, 174], "excel": 169, "except": [2, 7, 15, 155, 156, 159, 165], "exchang": 158, "excit": 156, "exclud": [4, 17, 20, 137, 138, 139, 140, 141, 142, 145, 146, 147, 154], "exclude_current_positions_from_observ": [137, 138, 139, 140, 141, 146, 147, 169], "exclude_namespac": 4, "exclus": [6, 136, 140, 141, 156], "execut": [1, 9, 16, 154, 158, 159, 165, 177, 178], "exhibit": 136, "exist": [2, 4, 5, 10, 11, 12, 15, 16, 17, 18, 19, 137, 138, 139, 140, 141, 143, 146, 147, 155, 156, 158, 161, 162, 178], "exist_ok": 173, "exit": [9, 10, 11, 12], "exp": 177, "expand": [5, 7], "expect": [2, 4, 5, 6, 7, 155, 156, 158, 159, 169, 175, 177, 178], "expens": [5, 155], "experi": [17, 136, 137, 140, 141, 142, 143, 148, 158, 159, 163, 174, 175, 177, 178], "experienc": 163, "experiment": [3, 131, 156], "explain": [155, 166], "explan": [174, 177], "explanatori": 174, "explicit": [156, 160], "explicitli": [3, 165, 166, 169], "exploit": [173, 174, 175], "explor": [2, 5, 148, 156, 159, 162, 173, 174, 175, 178], "explor_exploit_tradeoff": 175, "exponenti": [7, 14, 19, 20], "export": 156, "expos": [3, 148, 156], "express": [5, 9, 137, 140, 141], "ext_control": 6, "extend": [2, 17, 137, 156], "extens": [148, 156, 177], "extent": 153, "extern": [2, 137, 140, 141, 155, 156, 160, 166], "extra": [155, 156, 158, 165, 174], "extract": [9, 156, 175], "extrem": [148, 149], "ez": 155, "ezpickl": [4, 9, 15], "f": [153, 158, 159, 161, 163, 173, 174, 175, 177, 178], "f_": [137, 140, 141], "face": [137, 140, 141, 150, 163, 174], "facecolor": 174, "facedown": 150, "facilit": 136, "fact": 177, "factor": [14, 19, 129, 174, 177, 178], "factori": 4, "fail": [156, 158, 160], "failur": [158, 159, 160, 161, 166], "fair": 7, "fairli": [155, 156, 177], "fall": [127, 140, 151, 152, 153, 158, 163, 166, 169, 175], "fallen": [139, 169], "fals": [4, 6, 9, 10, 11, 12, 14, 16, 17, 18, 19, 128, 129, 132, 137, 138, 139, 140, 141, 146, 147, 150, 154, 155, 156, 158, 159, 160, 161, 163, 165, 169, 173, 174, 175, 177, 178], "familiar": 169, "familiaris": 159, "famou": 163, "far": [127, 128, 141, 142, 144, 145, 153, 158], "farama": [10, 11, 12, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 148, 156, 165, 171, 174, 177, 178], "fast": [128, 136, 138, 140, 142, 146, 148, 158, 160, 163], "faster": [127, 129, 137, 140, 141, 142, 145, 156, 163, 173, 178], "fastest": 158, "favor": [2, 155, 156], "favorit": 174, "favour": [2, 155, 156], "featur": [6, 7, 18, 136, 155, 156, 160, 178], "feature_spac": 6, "fed": 178, "feed": 178, "feedback": [156, 158, 159, 163], "feel": [169, 177], "feet": [138, 147], "fetchreach": 160, "few": [1, 131, 137, 138, 139, 140, 141, 143, 146, 147, 155, 156, 163, 169, 174, 175], "ffffffff": 153, "fffffhff": 153, "fffh": 153, "fffhffff": 153, "fffhfffg": 153, "ffoot": 138, "ffset": 177, "fhffhfhf": 153, "fhfh": 153, "fhhfffhf": 153, "fibonacci": 177, "fickl": [154, 156], "fickle_passeng": 154, "fidel": 148, "field": [156, 162], "fieteo": 155, "fig": [163, 174, 175, 178], "fig1": 174, "fig2": 174, "figaspect": 174, "fight": 148, "figsiz": [161, 163, 173, 174, 175, 177, 178], "figur": [139, 156, 161, 173, 174, 177], "file": [1, 131, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 155, 156, 161, 165, 169], "filenam": [9, 17, 161], "fill": 165, "filter": [14, 18, 20, 158, 173], "filter_kei": [14, 18], "filterobserv": [14, 18, 20], "filterobservationwrapp": 18, "final": [3, 9, 18, 155, 156, 159, 161, 163, 165, 166, 169, 174], "final_epsilon": [163, 174], "final_info": [14, 17, 155, 156], "final_observ": [14, 17, 155, 156], "find": [2, 4, 156, 158, 161, 162, 163, 165, 169, 175], "find_highest_vers": 4, "fine": [165, 178], "finetun": 148, "finfo": 175, "fingertip": [144, 145], "finish": [2, 128, 129, 155, 156, 158, 161, 163, 165, 178], "finit": [6, 7, 137, 143, 147, 166, 167, 177], "fire": 129, "firefoxmetzg": 155, "firmwar": 148, "first": [2, 4, 6, 9, 10, 11, 12, 15, 129, 131, 133, 134, 137, 138, 139, 140, 141, 142, 145, 146, 147, 151, 152, 154, 155, 156, 157, 159, 160, 161, 163, 165, 174, 175, 177], "five": [130, 155, 163, 177], "fix": [5, 6, 7, 14, 17, 19, 20, 129, 131, 132, 135, 136, 137, 138, 139, 140, 142, 143, 144, 145, 147, 148, 150, 153, 155, 156, 158, 159, 160, 165, 177], "fixtur": 145, "flag": [11, 133, 136, 148, 160], "flake8": [155, 156], "flappi": 148, "flat": [5, 6, 7, 8, 169], "flatdim": [5, 8, 155], "flatt": 178, "flatten": [5, 8, 14, 18, 20, 136, 155, 156, 158, 159, 163, 165, 174, 175, 178], "flatten_spac": [5, 8], "flattenobserv": [6, 14, 18, 20, 158, 159, 165], "flesh": 3, "flex": 144, "flexibl": [11, 148, 156, 159], "flight": 148, "float": [4, 7, 8, 9, 14, 16, 17, 18, 19, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 159, 163, 165, 173, 174, 175, 177, 178], "float32": [2, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 18, 127, 128, 129, 131, 132, 133, 134, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 156, 167], "float64": [5, 7, 8, 10, 14, 18, 19, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147], "flow": 148, "fluctuat": 163, "fluid": 146, "fly": [129, 160], "flycraft": 148, "fmt": 175, "fn": 13, "focu": [148, 159, 161, 178], "focus": [163, 171, 173], "foddi": 148, "folder": [1, 9, 17, 156, 161], "follow": [1, 3, 4, 5, 9, 10, 14, 16, 17, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 129, 131, 132, 133, 134, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 150, 151, 152, 153, 154, 155, 156, 159, 165, 166, 167, 169, 174, 175, 177, 178], "fontsiz": [174, 175], "foot": [11, 138, 139, 140, 141, 147], "foot_joint": [139, 147], "foot_left_joint": 147, "forc": [15, 129, 132, 133, 134, 136, 137, 140, 141, 142, 143, 147, 155, 169, 177], "forcibli": 166, "forearm": [140, 141, 144], "forev": 166, "foreverska": 156, "forex": 148, "forg": 165, "forget": [14, 15, 158, 165], "forgot": 159, "fork": [1, 156, 157, 160], "form": [5, 6, 7, 17, 131, 146, 156, 165], "formal": 166, "format": [1, 4, 5, 9, 14, 156, 158, 159, 160, 161, 169], "formerli": 156, "forward": [13, 19, 127, 137, 138, 139, 140, 141, 146, 147, 155, 156, 177, 178], "forward_reward": [137, 138, 139, 140, 146, 147, 169], "forward_reward_weight": [137, 138, 139, 140, 146, 147, 169], "found": [20, 136, 142, 148, 155, 156, 174, 177], "foundat": [148, 156, 165, 171], "four": [128, 129, 137, 139, 148, 154, 156, 158, 159, 174], "foxik": 155, "fp": [2, 9, 10, 17, 129, 156, 165], "frac": [137, 138, 139, 140, 141, 146, 147], "frame": [2, 9, 10, 17, 18, 20, 128, 129, 144, 145, 155, 156, 161, 175], "frame_skip": [17, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 169], "framer": 165, "frameskip": 17, "frameskipobserv": 156, "framestack": [17, 18, 155, 156], "framestackobserv": [17, 18, 20, 156], "frametim": [137, 138, 139, 140, 141, 146, 147], "framework": [14, 17, 20, 136, 148, 156, 169], "franuka": 153, "free": [131, 135, 136, 137, 140, 141, 142, 143, 148, 169, 174, 177], "free_body_rot": 146, "freedom": [140, 141, 142, 167], "freejoint": [140, 141], "freez": [14, 18, 19], "frequenc": 17, "frequent": [155, 166], "friction": [127, 146, 147, 148], "frictionless": 132, "from": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 127, 128, 129, 131, 136, 137, 138, 139, 140, 141, 142, 144, 145, 146, 147, 148, 150, 151, 152, 153, 154, 155, 156, 158, 159, 160, 161, 162, 163, 166, 169, 173, 174, 175, 177, 178], "from_json": [5, 156], "front": [137, 138, 146, 147], "front_left_leg": 137, "front_right_leg": 137, "frontpag": 156, "frozen": [149, 155, 156, 175], "frozen_lak": [153, 175], "frozenlak": [9, 153, 155, 156, 170, 171, 176], "frozenlake4x4": 156, "frozenlake8x8": [153, 155, 156], "frozenlake_q_learn": 175, "frozenset": 7, "fshin": 138, "fthigh": 138, "fuel": 129, "full": [3, 4, 128, 129, 155, 156, 158, 159, 174], "fulli": [2, 129, 137, 138, 139, 140, 141, 143, 146, 147, 148, 155], "fun": [174, 177], "func": [3, 14, 16, 18, 19, 156], "func_env": 3, "funcenv": [3, 156], "funcjaxenv": 156, "function": [2, 8, 10, 11, 12, 14, 16, 17, 18, 19, 20, 129, 132, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 153, 154, 155, 156, 158, 163, 166, 167, 169, 171, 174, 175, 177, 178], "functional_jax_env": 3, "functionaljaxenv": 3, "fundament": [159, 161, 163, 164, 168, 170], "furcolor": 9, "further": [2, 5, 7, 129, 144, 145, 155, 156, 175, 177], "furthermor": [2, 9, 156, 158], "furthest": 127, "futur": [3, 155, 156, 160, 163, 173], "future_q_valu": [163, 174], "g": [1, 2, 4, 5, 7, 8, 9, 11, 12, 13, 20, 131, 135, 137, 138, 139, 140, 141, 143, 146, 147, 148, 153, 154, 155, 156, 165, 167, 174, 175, 177, 178], "ga": 128, "gae": 178, "gaetanlepag": 156, "gain": [156, 167], "galleri": [1, 156], "game": [7, 9, 17, 126, 150, 151, 152, 153, 155, 156, 158, 159, 160, 163, 165, 174], "gamma": [14, 19, 160, 166, 175, 177, 178], "gap": 148, "garbag": [10, 11, 12, 17, 156], "gather": 165, "gaussian": 136, "gc_trigger": 17, "gcc": 148, "gen_gif": 1, "gen_md": 1, "gener": [1, 2, 3, 4, 5, 6, 7, 9, 10, 11, 12, 13, 15, 17, 127, 128, 129, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 150, 151, 152, 153, 154, 155, 156, 157, 159, 161, 162, 173, 178], "generalis": [2, 10], "generate_random_map": [153, 175], "geometr": [6, 136], "geometri": 156, "get": [2, 4, 11, 12, 14, 15, 18, 19, 127, 129, 136, 137, 139, 140, 142, 150, 155, 156, 158, 159, 161, 165, 166, 169, 173, 174, 175, 178], "get_act": [163, 174], "get_attr": [11, 12, 156], "get_env_id": 4, "get_loss": 178, "get_moving_avg": 163, "get_rect": 165, "get_stat": 155, "get_wrapper_attr": [15, 156], "gianluca": 156, "gianlucadecola": [155, 156], "giant": 163, "gif": [1, 131, 156], "git": [165, 169], "github": [19, 129, 132, 136, 137, 139, 140, 141, 142, 143, 144, 145, 147, 151, 152, 155, 156, 160, 165, 169, 171], "give": [2, 10, 129, 137, 150, 154, 155, 158, 159, 174, 177, 178], "given": [3, 4, 5, 7, 16, 127, 129, 130, 131, 132, 133, 134, 137, 139, 140, 142, 143, 147, 155, 156, 166, 174], "glfw": 136, "global": 4, "gnn": 148, "go": [2, 9, 128, 148, 150, 155, 159, 162, 163, 166, 169, 174, 177, 178], "go1": 169, "goal": [2, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 150, 151, 152, 153, 154, 159, 160, 163, 165, 177], "goal_slidei": 144, "goal_slidex": 144, "goal_veloc": [133, 134], "godsboy404": 156, "goe": [150, 155, 163], "gone": 155, "good": [158, 159, 163, 174, 175, 178], "googl": [155, 169], "goul\u00e3o": 156, "gp": 148, "gpu": [136, 148, 156, 162, 178], "gracefulli": 155, "gradient": [177, 178], "gradual": [158, 161, 163], "grai": 17, "grammat": 156, "grant": 129, "graph": [5, 6, 8, 13, 148, 155, 156, 158, 174, 178], "graphic": [136, 155], "graphinst": [6, 8, 13, 155, 156], "grasp": 148, "grave": 178, "gravit": 129, "graviti": [129, 132, 133, 135, 142, 143, 148, 177, 178], "grayscal": [14, 17, 18, 20], "grayscale_env": 18, "grayscale_newaxi": 17, "grayscale_ob": 17, "grayscaleobserv": [14, 18, 20], "great": [148, 167, 174], "greater": [129, 131, 132, 133, 134, 143, 150, 174], "greedi": [163, 173, 174, 175], "greedili": 174, "green": [131, 154], "grei": 174, "greyscal": 17, "grid": [148, 151, 152, 153, 154, 159, 161, 165, 173, 174], "grid_world": 165, "gridlin": 165, "gridworld": [2, 148, 151, 152, 158, 165], "gridworldenv": [159, 165], "griesbach": 156, "grip": 174, "ground": [127, 129, 141, 148], "group": [129, 155], "grow": 161, "gt": [155, 156], "guarante": [5, 6, 13, 17, 148, 171], "guess": 155, "guid": [148, 156, 157, 159, 169], "guidelin": 17, "guyazran": 156, "gym": [2, 5, 8, 9, 10, 11, 12, 14, 15, 16, 17, 18, 19, 126, 127, 128, 129, 131, 132, 133, 134, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 150, 151, 152, 153, 154, 156, 157, 158, 159, 161, 163, 165, 166, 167, 169, 173, 174, 175, 177, 178], "gym4real": 148, "gymfc": 148, "gymlibrari": 155, "gymnasium": [2, 3, 4, 5, 6, 7, 8, 9, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 126, 127, 128, 129, 130, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 150, 151, 152, 153, 154, 157, 159, 160, 161, 162, 163, 166, 169, 172, 173, 174, 175, 176, 177, 178], "gymnasium_env": [159, 165], "gymnasium_robot": [136, 156, 160], "gymnax": 148, "gymv21compat": 156, "gymv21environ": 160, "gymv22compat": 156, "gymv22environ": 156, "gymv26environ": 160, "gyroscop": 128, "h": 153, "h5": 178, "ha": [1, 2, 4, 5, 7, 8, 9, 10, 13, 14, 15, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 127, 128, 129, 130, 131, 132, 133, 134, 135, 136, 137, 139, 140, 141, 144, 145, 146, 148, 150, 154, 155, 156, 157, 158, 159, 163, 165, 166, 169, 173, 174, 175, 177, 178], "hacki": 13, "had": [2, 155, 156], "half": 136, "half_cheetah": 138, "halfcheetah": [14, 136, 138], "halt": 166, "hand": [148, 150, 163, 177], "handl": [5, 10, 11, 12, 142, 150, 155, 156, 158, 160, 163, 168, 170, 174], "handling_time_limit": 166, "hang": [13, 131, 155], "hannah": 156, "happen": [133, 134, 137, 139, 140, 142, 143, 147, 150, 153, 154, 155, 156, 158, 159, 163, 166], "haracterist": 177, "hard": [156, 159, 160, 175], "hardcor": 127, "harden": [155, 156], "harder": [129, 169], "hardwar": [148, 155, 156], "harlei": 178, "harm": 174, "hasattr": 156, "hash_se": 155, "hasselmo": 131, "hatchl": 165, "have": [2, 4, 5, 7, 8, 10, 11, 13, 14, 15, 16, 17, 18, 126, 127, 128, 131, 137, 140, 141, 142, 143, 144, 145, 147, 150, 153, 154, 155, 156, 158, 159, 160, 163, 165, 166, 167, 169, 174, 175, 177, 178], "haven": 17, "head": [11, 138, 160], "headless": [136, 155], "healthi": [137, 139, 140, 142, 143, 147], "healthy_angle_rang": [139, 147], "healthy_reward": [137, 139, 140, 142, 143, 147, 169], "healthy_state_rang": 139, "healthy_z_rang": [137, 139, 140, 147, 169], "heart": [158, 163], "heatmap": [174, 175], "height": [131, 136, 137, 139, 140, 142, 147, 155, 156, 169], "held": 150, "hello": 7, "help": [2, 4, 5, 9, 155, 156, 158, 161, 164, 168, 170, 173, 174, 178], "helper": [155, 159], "helpingstar": 156, "henc": [137, 149, 177], "here": [3, 9, 131, 137, 140, 155, 156, 159, 161, 163, 165, 169, 178], "heurist": [127, 129, 148, 156], "hffg": 153, "hidden": [2, 177], "hidden_space1": 177, "hidden_space2": 177, "hierarch": [5, 154], "high": [2, 6, 7, 8, 11, 12, 13, 14, 18, 131, 132, 134, 135, 137, 148, 155, 156, 158, 163, 167, 169, 178], "higher": [19, 127, 144, 163, 169, 173, 178], "highest": [4, 163], "highli": [5, 9, 126, 130, 148, 155, 165], "highwayenv": [148, 156], "hill": [133, 134], "hing": [137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147], "hinge2": 142, "hint": [155, 156], "hinter": 155, "hip": [127, 137, 140, 141], "hip_1": 137, "hip_2": 137, "hip_3": 137, "hip_4": 137, "histor": [148, 159], "histori": 136, "histplot": 175, "hit": [150, 158, 159, 163, 174], "hold": [5, 150, 174], "hole": [153, 175], "homepag": 156, "hood": 156, "hook": [155, 156], "hooper": 156, "hop": [136, 139, 147], "hope": 156, "hopefulli": [155, 174], "hopper": [15, 16, 136, 147, 156], "hopper_v4": 15, "hopperenv": 15, "horizon": [9, 139, 148, 166], "horizon_timestep": 9, "horizont": [127, 129, 131, 159, 165], "host": 156, "hot": 8, "hotter": 155, "hour": 161, "hous": 163, "how": [2, 5, 6, 9, 11, 12, 14, 141, 142, 144, 145, 148, 156, 158, 159, 160, 161, 163, 165, 166, 167, 171, 174, 178], "howardh": 156, "howev": [2, 5, 6, 7, 8, 9, 10, 11, 13, 16, 17, 131, 137, 138, 139, 140, 141, 145, 146, 147, 155, 156, 158, 165, 166, 167, 174, 178], "hpo": 171, "html": [18, 177], "http": [1, 2, 10, 11, 12, 18, 19, 128, 131, 150, 151, 152, 153, 155, 156, 165, 169, 174, 175, 177, 178], "hue": 175, "huge": [148, 155], "hull": 127, "human": [2, 6, 9, 17, 20, 128, 136, 140, 141, 144, 148, 155, 156, 157, 158, 159, 160, 165, 169, 178], "humanoid": [136, 156, 169, 171], "humanoidstandup": [136, 141], "humanoidstandup_v4": 155, "humanrend": [17, 20, 156], "humnaoid": 169, "hundr": 161, "hundredth": 17, "hyperparam": 178, "hyperparamet": [161, 163, 171, 173, 174, 175, 177, 178], "i": [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 126, 127, 128, 129, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 150, 151, 152, 153, 154, 155, 156, 157, 159, 160, 161, 162, 163, 164, 165, 166, 167, 168, 169, 170, 172, 173, 174, 175, 176, 177, 178], "i_": [137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147], "ianyfan": 156, "ic": 153, "ice1187": 155, "iclr": 178, "icml": 178, "icu": 148, "id": [4, 17, 136, 137, 140, 141, 153, 156, 159, 165], "idea": [158, 166, 174], "ident": [7, 11, 12, 136, 156], "identifi": [155, 161], "idx": 175, "if__name__": 178, "iff": [9, 17, 165], "iforce2d": 128, "igibson": 148, "ignor": [1, 9, 150, 155, 160, 163, 174], "ikamensh": [155, 156], "illeg": 154, "illustr": [14, 165, 166], "im": 143, "imag": [2, 5, 10, 11, 12, 14, 17, 18, 20, 128, 136, 156, 158, 169], "imagesequenceclip": 9, "imagin": [148, 158, 167], "img": 173, "immedi": [9, 19, 20, 137, 139, 140, 141, 147, 150, 158, 159, 163, 165], "immut": 5, "impact": [141, 160, 175], "impact_cost": 141, "impact_cost_rang": 141, "impact_cost_weight": 141, "implement": [5, 6, 9, 10, 15, 16, 17, 20, 129, 132, 135, 142, 148, 149, 155, 156, 158, 159, 160, 161, 163, 164, 165, 168, 170, 171, 172, 173, 176, 177, 178], "implementing_custom_wrapp": 167, "implic": 160, "implicitli": 178, "import": [2, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 127, 128, 129, 131, 132, 133, 134, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 150, 151, 152, 153, 154, 155, 156, 157, 158, 159, 160, 161, 163, 165, 167, 169, 173, 175, 177, 178], "importantli": [15, 156, 158], "importerror": 156, "imposs": [159, 163, 173], "improv": [11, 155, 156, 158, 160, 161, 162, 173], "imshow": 175, "inaccur": 163, "includ": [2, 4, 14, 17, 18, 20, 132, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 154, 155, 156, 158, 159, 161, 165, 166, 169, 171], "include_cfrc_ext_in_observ": [137, 140, 141, 169], "include_cinert_in_observ": [140, 141], "include_cvel_in_observ": [140, 141], "include_qfrc_actuator_in_observ": [140, 141], "inclus": [137, 155], "incompleteidea": [150, 151, 152], "inconsist": 160, "incorpor": 148, "incorrect": [154, 155, 156, 159, 166], "incorrectli": [19, 156], "increas": [129, 131, 132, 136, 139, 144, 146, 147, 156, 162, 163, 174, 175, 178], "incur": [131, 151, 152, 154], "independ": [6, 7, 10, 129, 139, 146, 147, 156, 173], "index": [1, 6, 9, 13, 14, 17, 18, 20, 132], "indic": [2, 9, 14, 17, 128, 131, 132, 150, 151, 152, 153, 154, 155, 163, 166, 173, 174, 175, 177], "individu": [2, 11, 12, 137, 138, 139, 140, 141, 142, 144, 145, 146, 147, 155, 159, 165, 167, 173, 177], "indoril007": 155, "induc": [137, 138, 139, 140, 141, 146, 147], "induct": [137, 138, 139, 140, 141, 146, 147], "ineffici": [156, 162], "inelast": [133, 134], "inertia": [140, 141], "inf": [2, 10, 16, 18, 132, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 156, 158, 167, 169], "infam": 174, "infeas": 7, "infer": [7, 155], "infinit": [16, 17, 18, 129, 139, 150, 155, 156, 158, 159, 163, 166, 174], "info": [2, 3, 9, 10, 11, 12, 14, 17, 18, 19, 20, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 154, 155, 156, 157, 158, 159, 160, 161, 163, 165, 166, 167, 169, 173, 174, 175, 177, 178], "inform": [1, 2, 5, 6, 7, 9, 10, 11, 12, 18, 20, 127, 128, 129, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 155, 156, 158, 159, 160, 163, 165, 166, 169, 174, 177], "infti": [7, 139], "inher": 166, "inherit": [4, 5, 15, 16, 18, 19, 155, 156, 159, 165], "init": [128, 159, 161, 165, 178], "initi": [2, 3, 4, 6, 7, 9, 10, 14, 15, 16, 17, 18, 19, 127, 129, 130, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 150, 151, 152, 153, 154, 155, 159, 161, 163, 167, 169, 173, 174, 175, 177, 178], "initial_epsilon": [163, 174], "initial_sampl": 156, "initialis": [2, 4, 10, 17, 150, 156, 157], "inlin": 178, "inner": 11, "inner_st": 6, "inplac": 177, "input": [9, 10, 156, 158, 159, 174, 178], "inregular": 17, "insert": [157, 177], "insid": [1, 6, 7, 17, 148, 154, 159, 165], "insight": [148, 158, 163], "inspect": 9, "inspir": [151, 152, 156, 175], "instabl": [162, 163], "instal": [1, 9, 17, 126, 130, 136, 155, 156, 158, 160, 165, 169], "instanc": [2, 3, 4, 5, 6, 8, 9, 10, 11, 13, 17, 18, 156, 158, 159, 162, 167, 178], "instanti": [9, 14, 17, 18, 19, 165, 175], "instead": [2, 10, 11, 14, 15, 127, 131, 137, 140, 147, 155, 156, 158, 159, 160, 161, 163, 165, 178], "institut": [133, 134], "instruct": [136, 148, 156, 165], "insuffici": 163, "int": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 136, 137, 150, 151, 152, 153, 154, 156, 159, 163, 165, 173, 174, 175, 177, 178], "int23": 17, "int32": [6, 8, 10, 14, 18, 159], "int64": [6, 7, 8, 156, 159], "int8": [5, 7], "int_32": 17, "integ": [2, 6, 7, 8, 9, 14, 16, 17, 18, 155, 156, 159, 165], "integr": [9, 156, 169], "intellig": [154, 155, 158, 163], "intend": [3, 14, 17, 148, 151, 152, 153, 154, 171, 175], "intens": 148, "interact": [5, 9, 14, 17, 20, 148, 158, 159, 163, 165, 174, 178], "interest": [18, 156, 161, 169], "interestingli": 175, "interfac": [9, 156, 157, 158], "interlink": 158, "intermedi": [140, 141, 159], "intermitt": 17, "intern": [2, 3, 10, 155, 156, 159, 160, 161], "internet": 148, "interoper": 148, "interv": [7, 137, 139, 140, 147, 161], "intrins": 167, "introduc": [137, 140, 141, 148, 155, 156, 160], "introduct": [131, 150, 151, 152, 175], "introductori": 156, "invalid": [2, 7, 156, 159, 169, 173, 174], "invers": 4, "invert": [135, 136, 177], "inverted_double_pendulum": 142, "inverted_pendulum": [143, 177], "inverteddoublependulum": [136, 142], "invertedpendulum": [136, 143, 177], "investig": 156, "involv": [6, 126, 142, 148, 151, 152, 153, 154, 155, 156, 165, 177], "io": [18, 148, 153], "ipynb": [165, 166, 167, 169, 173, 174, 175, 177, 178], "irrelev": 159, "irrespect": 9, "is_avail": 178, "is_bound": 7, "is_np_flatten": [5, 156], "is_rain": 154, "is_raini": 154, "is_slipperi": [151, 152, 153, 156, 175], "is_slippi": 156, "is_vector_env": 9, "isaac": 148, "isinst": 156, "isn": [6, 9, 156, 159, 161], "isort": 156, "issu": [17, 18, 129, 132, 136, 137, 139, 140, 141, 142, 143, 144, 145, 147, 155, 156, 160, 161, 165], "itch": 153, "item": [9, 13, 18, 174, 175, 178], "iter": [5, 6, 12, 13, 156, 159], "itomori": 148, "its": [2, 9, 16, 17, 129, 135, 136, 137, 139, 141, 144, 147, 148, 156, 158, 160, 175, 177, 178], "itself": [3, 8, 10, 11, 12, 15, 17, 155, 156, 158, 159, 160, 178], "j": [156, 177, 178], "jack": 150, "jair": 154, "jamartinh": 156, "jax": [2, 14, 17, 20, 148, 156, 162], "jax_to_numpi": 156, "jaxenv": [14, 17], "jaxtonumpi": [14, 17, 20, 156], "jaxtotorch": [14, 17, 20, 156], "jessefarebro": 155, "jet": 156, "jfpettit": 155, "jimini": 148, "jin": 156, "jit": 162, "jjshoot": [155, 156], "jkterry1": 155, "jnp": 17, "job": [148, 165], "job_statu": 6, "john": 156, "johnminelli": 155, "johnnycode8": 171, "join": [5, 156], "joint": [127, 129, 131, 132, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147], "joint0": 145, "joint1": 145, "jordan": [137, 156, 178], "journal": 154, "journei": [155, 174], "json": 156, "json_env_spec": 156, "jsonabl": 5, "jump": 169, "jumpi": 156, "jun": 156, "junk": 14, "jupyt": [1, 155, 165, 166, 167, 169, 170, 173, 174, 175, 177, 178], "just": [3, 13, 15, 143, 145, 155, 156, 158, 159, 160, 162, 163, 165, 169, 178], "k": [8, 9, 14, 129, 146, 156, 178], "kad99kev": 156, "kalli": 169, "kallinteri": [156, 169], "karp": 178, "kavukcuoglu": 178, "kde": 175, "keep": [9, 14, 17, 18, 20, 132, 141, 143, 159, 163, 165], "keep_dim": [14, 18], "kei": [2, 4, 5, 6, 7, 9, 10, 14, 17, 18, 20, 137, 138, 139, 140, 141, 146, 147, 151, 152, 153, 154, 155, 156, 158, 163, 165, 166, 167, 173, 174, 175], "kellycoinflip": 155, "kept": [10, 136, 169], "kerajli": 156, "kexianshen": 155, "key_to_act": 9, "keyb0ardninja": 156, "keyboard": [7, 9, 155], "keys_to_act": [9, 155, 178], "keyword": [4, 6, 10, 11, 12, 14, 131, 132, 150, 155, 156, 158, 165, 174], "kg": [155, 156], "khoda81": 156, "kind": 7, "king": 150, "kir0ul": [155, 156], "klimov": [126, 127, 128, 129], "knee": [127, 140, 141], "know": [2, 156, 158, 159, 160, 162, 163, 165], "knowledg": [4, 163], "known": [2, 163], "krimmel": 156, "kvrban": 156, "kwarg": [3, 4, 9, 10, 11, 12, 14, 15, 137, 138, 139, 140, 146, 147, 156, 165], "kwiatkowski": 156, "l": [14, 17, 146, 156, 161], "l2r": 148, "lab_black": 175, "label": [161, 173, 174, 175], "laboratori": 148, "lack": 156, "ladder": 127, "lai": 141, "lake": [149, 155, 156], "lam": 178, "lambaactionv0": 156, "lambda": [11, 12, 14, 16, 17, 18, 19, 156, 161, 163, 174, 178], "lambdaact": 14, "land": 129, "lander": [126, 155, 156], "lane": 148, "lap": [128, 155], "lap_complete_perc": 128, "larg": [11, 129, 134, 137, 138, 139, 140, 141, 144, 145, 146, 147, 148, 155, 156, 162, 163, 167, 169, 175], "larger": [163, 178], "largest": 155, "last": [9, 13, 14, 17, 18, 20, 141, 144, 145, 155, 156, 161, 165, 166, 175], "latent": 148, "later": [129, 158, 159, 161, 163, 174, 177, 178], "latest": [2, 162, 177], "latin": 7, "latter": [151, 152], "lava": 2, "layer": [3, 15, 158, 159, 177], "lazili": 5, "lazyfram": 18, "lead": [160, 178], "learn": [2, 5, 6, 17, 18, 19, 127, 128, 129, 131, 132, 133, 134, 138, 142, 143, 146, 148, 149, 150, 151, 152, 154, 155, 156, 157, 161, 162, 165, 169, 170, 171, 173, 176, 178], "learner": 175, "learning_r": [163, 173, 174, 175, 177], "learnt": 4, "least": [7, 129, 136], "leav": [132, 142, 165, 175], "left": [7, 127, 128, 129, 132, 133, 137, 140, 141, 142, 143, 147, 151, 152, 153, 154, 158, 159, 165, 169, 173, 174, 175, 177], "left_elbow": [140, 141], "left_elfbow": [140, 141], "left_foot": [140, 141], "left_hip_i": [140, 141], "left_hip_x": [140, 141], "left_hip_z": [140, 141], "left_hiz_z": [140, 141], "left_kne": [140, 141], "left_lower_arm": [140, 141], "left_shoulder1": [140, 141], "left_shoulder2": [140, 141], "left_sin": [140, 141], "left_thigh": [140, 141], "left_upper_arm": [140, 141], "leg": [127, 129, 137, 139, 140, 141, 147], "leg_joint": [139, 147], "leg_left_joint": 147, "legaci": 155, "legend": [161, 173, 174, 175], "legend_el": 174, "len": [6, 17, 161, 163, 167, 173, 174, 178], "length": [4, 6, 7, 9, 11, 12, 14, 17, 20, 127, 131, 132, 133, 134, 146, 148, 153, 154, 155, 156, 158, 161, 163, 174, 178], "length_mask": 6, "length_moving_averag": [163, 174], "length_queu": [14, 17, 161, 163, 174], "leq": 142, "less": [127, 129, 146, 147, 158, 163, 175], "lesson": 175, "let": [148, 156, 158, 159, 163, 165, 167, 173, 174, 175, 177], "letter": [153, 154, 155], "level": [9, 15, 158, 161, 169], "levin": [137, 178], "lg": 156, "li": [141, 156], "lib": [151, 152], "librari": [148, 156, 157, 165, 169], "licens": [155, 156, 165, 174, 175, 177, 178], "lidar": 127, "life": [17, 155, 156, 177], "lift": 144, "light": 148, "lighter": 156, "lightgreen": 174, "lightli": 160, "lightweight": [148, 161], "ligibl": 177, "like": [3, 5, 7, 9, 13, 14, 15, 16, 17, 18, 19, 20, 138, 143, 147, 148, 154, 155, 156, 158, 159, 161, 163, 165, 167, 169, 171, 178], "lillicrap": 178, "limit": [17, 20, 132, 143, 155, 156, 158, 159, 160, 162, 163, 168, 170, 174, 177, 178], "lin826": 155, "linalg": [9, 159, 165], "line": [2, 5, 131, 155, 156, 159, 165], "linear": [10, 129, 131, 142, 143, 146, 177, 178], "linearli": [14, 16, 18, 20, 131, 142, 143, 177], "linecolor": 175, "lineplot": [175, 177], "linewidth": [161, 173, 174, 175], "link": [21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 131, 137, 145, 146, 156, 165], "linux": 156, "list": [2, 4, 5, 6, 7, 9, 10, 11, 12, 14, 15, 17, 18, 155, 156, 158, 159, 161, 174, 175, 178], "list_info": 14, "listdir": 17, "liter": 156, "littl": [129, 156, 159, 163], "live": [1, 9, 159, 174], "ll": [155, 158, 159, 161, 163, 173, 174, 178], "llvm": 148, "load": [4, 155, 156, 168, 170], "load_env_cr": 4, "load_ext": 175, "load_quadruped_model": 169, "load_state_dict": 178, "load_weight": 178, "loc": [154, 178], "local": 165, "localhost": 1, "locat": [4, 136, 148, 151, 152, 153, 154, 159, 165, 173], "log": [2, 9, 14, 16, 17, 18, 19, 161, 175, 177, 178], "log_prob": [177, 178], "logan": 156, "logger": [17, 155], "logic": [11, 128, 155, 156, 159, 163, 165, 169], "logical_or": 156, "logit": 178, "long": [7, 9, 17, 132, 143, 148, 155, 156, 159, 161, 163], "longer": [2, 136, 137, 139, 143, 147, 155, 156, 160, 177], "look": [5, 9, 17, 158, 160, 161, 165, 166, 167, 175, 178], "loop": [148, 160, 174, 178], "lose": [129, 150, 163, 174], "loss": [17, 150, 163, 177, 178], "lost": 17, "lot": [15, 163, 167, 174, 177], "low": [2, 6, 7, 8, 12, 13, 14, 18, 131, 132, 134, 135, 155, 156, 163, 167, 173, 178], "lower": [7, 14, 15, 19, 20, 140, 141, 155, 158, 163, 174, 178], "lower_waist": [140, 141], "lpizzinidev": 156, "lr": [163, 174, 175, 177, 178], "lt": [155, 156], "lucasalegr": 156, "lunar": [126, 155, 156], "lunar_land": [129, 156], "lunarland": [17, 129, 155, 156, 157, 160, 163, 178], "lunarlandercontinu": 167, "lwaist": [140, 141], "lz4": 18, "m": [8, 131, 133, 134, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 155, 169, 178], "mab": 148, "machado": [16, 17], "machin": [155, 175, 177], "made": [1, 129, 137, 138, 139, 140, 141, 143, 146, 147, 155, 156, 160, 169, 171, 178], "magnitud": [9, 129, 134, 142, 143, 177], "mahiuchun": 155, "mai": [2, 5, 7, 8, 9, 11, 14, 15, 16, 18, 19, 151, 152, 153, 158, 160, 165, 169, 178], "main": [2, 129, 139, 147, 156, 160, 169, 175], "main_bodi": [137, 169], "mainli": [137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147], "maintain": [136, 148, 155, 156, 157, 160, 171, 173], "mainten": 155, "major": [155, 156], "make": [1, 2, 6, 9, 11, 12, 15, 16, 17, 18, 19, 127, 128, 129, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 150, 151, 152, 153, 154, 155, 156, 157, 158, 160, 161, 163, 167, 168, 169, 170, 173, 174, 175, 177, 178], "make_dict": 14, "make_vec": [2, 4, 9, 10, 11, 12, 14, 132, 156, 159, 162, 178], "malici": 156, "manag": [4, 13, 148, 163], "mandatori": [159, 165], "manhattan": [159, 165], "mani": [7, 14, 17, 136, 148, 155, 156, 159, 160, 163, 165, 174, 175], "manipul": 148, "manner": [3, 7, 18, 20, 155], "mantasu": 156, "manual": [9, 14, 158, 178], "manual_se": 177, "manuel": 156, "manufactur": 169, "map": [9, 14, 17, 153, 154, 156, 158, 159, 163, 165, 174, 177], "map_nam": 153, "map_siz": 175, "mar": [148, 156], "mariojerez": 156, "marionj": 156, "mark": 156, "markdown": 1, "market": 148, "markov": [148, 156, 158, 166], "markovian": 148, "marku": 156, "markus28": [155, 156], "marsexplor": 148, "mask": [5, 6, 7, 148, 154, 155, 156, 170, 176, 178], "masked_mean_curv": 173, "masked_mean_reward": 173, "masked_overall_mean": 173, "masked_overall_std": 173, "masked_result": 173, "masked_results_list": 173, "mass": [129, 137, 140, 141, 146], "massiv": 155, "master": [18, 151, 152, 155, 158, 177], "match": [4, 8, 11, 12, 16, 132, 156], "math": [135, 148, 155, 163], "mathbb": 7, "mathcal": [137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147], "mathemat": [5, 158, 177], "matplotlib": [9, 161, 163, 173, 174, 175, 177, 178], "matpoliquin": 156, "matric": [5, 148], "matrix": [6, 140, 141, 148], "matter": [7, 155, 159, 160], "matyasch": 156, "max": [4, 7, 14, 16, 17, 18, 20, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 153, 156, 163, 173, 174, 175, 177, 178], "max_a": 166, "max_act": [14, 15, 16, 20], "max_episode_step": [4, 17, 156, 159, 165, 169, 178], "max_geom": 136, "max_id": 175, "max_length": 7, "max_ob": [14, 18, 20], "max_reward": [10, 14, 19, 156, 167], "max_time_step": [132, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147], "maxandskipenv": 18, "maxandskipobserv": [18, 20, 156], "maxim": [159, 163, 177, 178], "maximis": 162, "maximum": [4, 7, 9, 14, 17, 18, 20, 129, 131, 135, 142, 156, 158, 163, 165, 173, 175, 178], "maxq": 154, "mayb": [2, 175], "maze": 159, "mclean": 156, "md": [1, 155, 156, 165], "mdp": [2, 17, 133, 134, 148, 158], "mean": [2, 14, 18, 19, 20, 131, 139, 144, 155, 156, 163, 165, 173, 175, 177, 178], "mean_reward": 173, "meaning": 163, "meant": 3, "meantim": 156, "measur": [9, 127, 135, 141, 142, 144, 145, 155, 159], "mechan": 156, "medium": 148, "mel": 153, "melbourn": 175, "melt": 177, "member": 5, "memori": [5, 17, 133, 134, 155, 156, 161, 162], "menageri": 169, "mention": [156, 177], "menu": 158, "mere": 165, "merg": 156, "meshcat": 148, "meshgrid": 174, "messag": [5, 155, 156, 161], "meta": [148, 155], "metaclass": 155, "metadata": [2, 3, 9, 10, 15, 17, 155, 156, 165, 167], "metatrad": 148, "metaworld": 148, "meter": [135, 148], "meth": [7, 17], "method": [3, 4, 6, 9, 14, 16, 17, 18, 19, 148, 155, 156, 159, 160, 163, 165, 167, 177, 178], "methodologi": 148, "metric": [2, 9, 156, 161, 178], "mgoulao": 156, "micim": 155, "microgrid": 148, "mid": 160, "middl": [139, 147, 163], "might": [2, 5, 7, 8, 15, 16, 158, 159, 162, 165, 167, 174, 177, 178], "migrat": [136, 156, 157], "mihaic": 156, "mileston": 161, "miller": 175, "min": [7, 14, 16, 131, 132, 133, 134, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147], "min_act": [14, 15, 16, 20], "min_length": 7, "min_ob": [14, 18, 20], "min_reward": [10, 14, 19, 156, 167], "minari": 148, "minatari": 148, "mind": 156, "mine": 148, "minecraft": 148, "minesweep": 148, "minetest": 148, "miniatur": 148, "minibatch": 178, "minigrid": [148, 156], "minim": [2, 148, 156, 159, 165, 166, 175, 178], "minimalist": 148, "minimum": [7, 14, 18, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 158, 159, 163, 175], "miniwob": 148, "miniworld": 148, "minor": [155, 156], "mirza": 178, "misc": [155, 156], "mischapanch": 156, "miss": [131, 154, 155, 156, 158, 159, 161], "mission": 5, "mistak": [156, 158, 159], "mit": [131, 174, 175, 177, 178], "mitig": 178, "mixtur": 156, "mj_camera": [137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147], "mj_step": [137, 140], "mjcf": 169, "mjdata": 136, "mjtvisflag": 136, "mjvcamera": 136, "mjvis_contactforc": 136, "mjvis_contactpoint": 136, "mjvisual": 136, "mkdir": [173, 178], "ml": [148, 155], "mmcaulif": 156, "mnih": 178, "mo": 148, "moba": 148, "mobil": 148, "modal": 136, "mode": [2, 4, 10, 11, 12, 14, 155, 156, 158, 161, 163, 165, 174, 178], "model": [137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 156, 159, 160, 171, 174], "modern": [148, 160], "modif": 167, "modifi": [2, 4, 5, 10, 14, 15, 16, 18, 19, 20, 131, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 154, 155, 156, 159, 165, 167], "modul": [4, 5, 13, 155, 156, 165, 167, 177, 178], "modular": [14, 15, 148, 158, 165, 167], "module_nam": 156, "moduletyp": [14, 17], "mojoco": 171, "moment": 3, "monitor": [17, 155, 156, 161], "monop": 136, "mont": [163, 174, 177, 178], "month": 156, "moon": 129, "moor": [133, 134], "moore90efficientmemori": [133, 134], "more": [1, 2, 5, 6, 7, 10, 11, 12, 14, 15, 16, 19, 20, 127, 129, 136, 137, 140, 141, 142, 143, 144, 145, 146, 147, 148, 155, 156, 158, 159, 160, 162, 163, 165, 166, 167, 169, 173, 174, 175, 177, 178], "moreov": [5, 14, 15, 17, 165, 167], "moritz": [137, 178], "most": [2, 5, 7, 13, 14, 15, 17, 18, 136, 145, 148, 155, 156, 158, 160, 162, 163, 165, 167, 169, 170, 172, 174, 176], "mostli": [155, 163], "motion": 148, "motor": [127, 146, 148, 155, 169], "motor1_rot": 146, "motor2_rot": 146, "mountain": [130, 155, 158], "mountaincar": [14, 133, 163, 171], "mountaincarcontinu": [14, 16, 19, 134], "mountaincarenv": 133, "move": [2, 14, 17, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 127, 129, 132, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 151, 152, 153, 154, 155, 156, 158, 159, 160, 161, 163, 165, 166, 169, 173, 175, 177], "movement": [154, 159, 163, 165], "moviepi": [9, 17, 155, 156], "moving_avg": 161, "mozer": 131, "mp": 13, "mp4": 161, "mpi": 13, "mpi4pi": 13, "mpi_init": 13, "mt19937": 155, "mtsim": 148, "much": [155, 156, 159, 160, 163, 165, 166, 169], "mujoco": [1, 9, 15, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 155, 156, 158, 167, 169, 170, 176], "mujoco_env": [155, 156], "mujoco_gl": 136, "mujoco_menageri": 169, "mujoco_reinforc": 177, "mujoco_rend": 155, "mujocoenv": 156, "mujocorend": 156, "mujocorender": 156, "multi": [2, 7, 136, 140, 141, 144, 148, 159], "multiag": 148, "multibinari": [5, 6, 7, 8, 13, 18, 156, 158], "multidiscret": [5, 6, 7, 8, 10, 13, 18, 155, 156, 158, 165], "multimod": 148, "multipl": [5, 6, 7, 10, 11, 12, 13, 155, 156, 158, 159, 161, 162, 173, 178], "multipli": [6, 129, 134, 144, 145, 178], "multiprocess": [5, 11, 13, 178], "multivari": [137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147], "must": [2, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 128, 136, 139, 147, 155, 156, 159, 163, 165, 166], "mutual": 136, "my": 175, "my_packag": 159, "mypi": [2, 156], "n": [4, 5, 6, 7, 8, 11, 12, 13, 17, 18, 20, 128, 131, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 155, 156, 158, 161, 163, 173, 174, 175, 177, 178], "n_action": [173, 178], "n_env": 178, "n_episod": [163, 174], "n_featur": 178, "n_run": [173, 175], "n_showcase_episod": 178, "n_state": 173, "n_steps_per_upd": 178, "n_updat": 178, "na": 145, "name": [1, 3, 4, 11, 12, 15, 20, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 155, 156, 159, 161, 165], "name_prefix": [9, 17, 161], "namedtupl": [156, 175], "namespac": [4, 159, 165], "nanoquadrotor": 148, "narrow": 175, "nativ": 17, "natur": [148, 150, 153, 160, 163, 174], "naverag": 161, "navig": [148, 154, 159, 165, 167], "nbodi": [137, 140, 141], "nchain": 155, "ncol": [151, 152, 153, 163, 174, 175, 178], "ncrement": 177, "ndarrai": [2, 3, 6, 7, 8, 9, 13, 14, 16, 17, 18, 19, 131, 132, 133, 134, 135, 154, 177, 178], "neccari": 9, "necessari": [2, 5, 126, 155, 156, 173], "necessarili": 8, "need": [2, 5, 6, 9, 14, 15, 16, 18, 127, 129, 132, 136, 155, 156, 158, 159, 160, 161, 162, 163, 165, 166, 167, 169, 173, 174, 175, 178], "need_visu": 160, "neg": [2, 7, 9, 134, 137, 138, 139, 140, 141, 142, 144, 145, 146, 147, 154, 158, 159, 163, 177], "neither": [7, 17, 150, 154], "nerdyespresso": 156, "nervous": 127, "nest": [6, 13, 148], "net": [128, 150, 151, 152, 177, 178], "network": [5, 8, 10, 13, 146, 148, 158, 159, 163, 178], "neural": [5, 8, 10, 13, 131, 146, 148, 159, 163, 177, 178], "neurip": 131, "neuro": 148, "neuroflight": 148, "neuronlik": [132, 142, 143], "nevalu": 161, "never": [2, 138, 141, 144, 145, 146, 156, 173], "nevertheless": 167, "new": [2, 5, 14, 15, 16, 17, 18, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 131, 132, 133, 134, 135, 137, 138, 139, 140, 141, 146, 147, 154, 155, 156, 157, 158, 159, 162, 163, 165, 166, 167, 169, 174, 175, 178], "new_action_spac": 14, "new_obs_spac": 14, "new_po": 159, "new_q": 163, "new_spac": 14, "new_stat": 175, "new_throughput": 9, "newer": [136, 155], "newli": [14, 18, 19], "newlin": 2, "next": [2, 3, 10, 13, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 156, 157, 169, 173, 177], "next_mask": 173, "next_max": 173, "next_ob": [156, 160, 163, 174, 177], "next_stat": [3, 156, 163, 173, 174], "next_step": [11, 12], "next_valu": 160, "nice": 155, "nidhish": 156, "nine": 137, "nintendo": 7, "nip": 131, "nlp": 148, "nlpgym": 148, "nn": [177, 178], "no_grad": 178, "node": [5, 6, 8, 155, 158], "node_spac": [6, 8], "nois": [130, 136, 156], "noisi": [161, 163], "non": [2, 5, 8, 9, 14, 17, 129, 132, 137, 138, 139, 140, 141, 146, 147, 148, 153, 155, 156, 159, 165, 166, 177], "non_random_ob": 128, "nonbreak": 155, "nondeterminist": [4, 165], "none": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 136, 153, 155, 156, 158, 159, 160, 165, 173, 174, 175, 178], "nonlinear": 139, "nonzero": 173, "noop": [7, 9, 17, 154, 156, 178], "noop_max": [17, 156], "nor": [7, 17, 150, 151, 152, 154], "norm": [9, 144, 145, 159, 165], "normal": [2, 4, 7, 10, 13, 14, 17, 18, 19, 20, 127, 128, 135, 137, 138, 142, 155, 156, 162, 163, 177, 178], "normalis": 156, "normalize_tim": 18, "normalizeobserv": [14, 18, 20, 155, 156], "normalizereward": [14, 19, 20, 155], "normalizex": 156, "north": [154, 173], "notabl": [155, 156, 166], "note": [1, 5, 9, 13, 14, 17, 18, 131, 132, 136, 137, 139, 140, 141, 142, 144, 147, 154, 158, 160, 162, 166, 169, 174, 177, 178], "notebook": [1, 155, 165, 166, 167, 169, 170, 173, 174, 175, 177, 178], "noth": [3, 128, 129, 156, 159, 177], "notic": 156, "notif": 156, "notimplementederror": 8, "nov": 154, "now": [2, 127, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 155, 156, 158, 159, 163, 165, 166, 169, 173, 174, 175, 177], "np": [2, 5, 6, 7, 9, 10, 12, 13, 14, 16, 18, 19, 129, 133, 140, 141, 154, 155, 156, 159, 161, 163, 165, 167, 169, 173, 174, 175, 177, 178], "np_random": [2, 5, 9, 10, 11, 12, 15, 155, 156, 159, 165], "np_random_se": [2, 10, 11, 12, 15, 156], "nrow": [153, 175, 178], "nstep": 156, "num": [14, 17, 131, 132, 133, 134, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147], "num_col": 4, "num_edg": 6, "num_env": [4, 10, 11, 12, 13, 14, 132, 156, 159, 178], "num_episod": 163, "num_eval_episod": 161, "num_nod": 6, "num_training_episod": 161, "number": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 16, 17, 18, 20, 128, 129, 131, 136, 139, 140, 141, 146, 147, 148, 150, 153, 155, 156, 158, 159, 161, 162, 163, 165, 169, 175, 177, 178], "numer": [142, 143, 150, 155, 156, 161, 167, 177], "numpi": [2, 5, 7, 9, 10, 11, 12, 13, 14, 16, 17, 18, 19, 20, 155, 156, 159, 161, 163, 165, 167, 169, 173, 174, 175, 177, 178], "numpytotorch": [14, 17, 20, 156], "nv": [140, 141], "nvec": 7, "nvidia": 148, "o": [17, 161, 177, 178], "o_": 166, "o_t": 166, "ob": [9, 12, 14, 16, 17, 18, 128, 154, 155, 156, 158, 159, 160, 161, 163, 167, 169, 174, 177], "obj_slidei": 144, "obj_slidex": 144, "object": [2, 5, 9, 11, 12, 13, 14, 15, 136, 144, 145, 148, 156, 158, 161, 174, 177], "obs0": 18, "obs1": 18, "obs2": 18, "obs3": 18, "obs4": 18, "obs_kei": 18, "obs_shap": 178, "obs_space_dim": 177, "obs_t": 9, "obs_tp": 9, "obs_tp1": 9, "observ": [2, 3, 4, 5, 6, 9, 10, 11, 12, 13, 15, 17, 19, 20, 148, 155, 156, 157, 160, 162, 163, 166, 167, 173, 175, 177], "observation_mod": [11, 12], "observation_spac": [2, 5, 6, 7, 9, 10, 11, 12, 13, 14, 15, 18, 158, 159, 165, 167, 173, 175, 177], "observation_structur": [137, 138, 139, 140, 141, 143, 146, 147], "observationwrapp": [14, 15, 18, 165, 169], "obstacl": 159, "obstructview": 156, "obstyp": [2, 3, 9, 10, 11, 12, 14, 15, 16, 17, 18, 19, 156, 177], "obswrapp": 155, "obtain": [15, 17, 135, 150, 166], "obviou": 166, "obvious": 156, "occur": [2, 10, 131, 132, 165, 178], "octob": 136, "odyse": 169, "off": [17, 128, 129, 151, 152, 154, 155, 156, 158, 159, 173, 175], "offer": 148, "offici": 3, "offlin": [148, 156], "offscreen": [155, 156], "offset": [129, 140, 141], "offworld": 148, "often": [2, 5, 148, 156, 163, 165, 175], "oftentim": 165, "old": [10, 16, 136, 155, 156, 157], "old_epsilon": 163, "old_po": 159, "old_spac": 14, "old_throughput": 9, "older": [136, 156, 160], "oldv21env": 160, "oldv26env": 160, "oleg": [126, 127, 128, 129], "olimoyo": 155, "olipinski": [155, 156], "omar": 156, "omega_1": 142, "omega_2": 142, "omesa": 136, "omg": 148, "omit": [137, 138, 139, 140, 141, 146, 147], "omniisaacgymenv": 148, "omnivers": 148, "onc": [1, 17, 154, 155, 159, 160, 163, 165, 174, 178], "one": [2, 5, 6, 7, 8, 9, 11, 15, 16, 131, 132, 133, 134, 135, 136, 137, 139, 142, 143, 146, 150, 154, 155, 156, 159, 161, 163, 166, 167, 169, 174, 175, 177, 178], "oneof": [5, 6, 8, 13, 156], "ones": [14, 130, 155, 163, 174, 178], "ongo": 178, "onli": [2, 4, 5, 6, 7, 8, 9, 10, 17, 18, 131, 132, 133, 134, 137, 138, 139, 140, 141, 142, 143, 145, 146, 147, 154, 155, 156, 159, 160, 161, 165, 167, 169, 173, 174, 175, 178], "onlin": [140, 141, 150, 151, 152, 160], "onward": 166, "op": [17, 156], "open": [1, 17, 136, 148, 155, 156, 158, 165], "openai": [2, 19, 126, 155, 156, 157, 166, 174, 177], "opencv": [14, 17, 18, 20, 155], "opengl": [136, 156], "openmodelica": 148, "oper": [8, 14, 136, 148, 155], "oppon": 159, "opportun": 148, "opt": 169, "optim": [13, 14, 17, 127, 129, 140, 141, 148, 156, 158, 159, 160, 163, 174, 175, 177, 178], "optimis": [10, 148, 155, 171], "optimist": 163, "option": [2, 3, 4, 5, 6, 7, 10, 11, 12, 14, 15, 18, 128, 131, 132, 133, 134, 135, 136, 148, 155, 156, 158, 159, 160, 165], "ord": [9, 159, 165], "order": [4, 5, 6, 15, 17, 129, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 155, 156, 158, 162, 165, 175], "order_enforc": [4, 165], "ordereddict": 156, "orderenforc": [4, 15, 17, 20, 127, 128, 129, 131, 132, 133, 134, 135, 155, 156, 158, 159, 165], "orderli": 155, "org": [10, 11, 12, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 156, 174, 177, 178], "orient": [129, 137, 140, 141], "origin": [8, 10, 14, 16, 17, 18, 128, 131, 132, 136, 142, 155, 156, 158, 159, 160, 163, 169], "orsini": 155, "osmesa": 136, "other": [14, 16, 20, 129, 135, 136, 138, 140, 142, 146, 147, 153, 154, 155, 156, 158, 160, 161, 163, 165, 167, 169, 171, 174, 175, 177, 178], "otherwis": [2, 4, 6, 7, 9, 11, 12, 14, 17, 18, 139, 155, 156, 159, 174, 175], "our": [156, 158, 159, 160, 163, 165, 169, 174, 175, 178], "out": [2, 3, 13, 14, 15, 148, 155, 156, 165, 166, 167, 171, 177], "outcom": [150, 175], "outer": 131, "outermost": 14, "outlin": [150, 155, 158, 159, 163, 174], "output": [1, 9, 10, 13, 14, 17, 155, 156, 158, 159, 165, 174, 177, 178], "output_truncation_bool": 9, "outsid": [2, 14, 18, 128, 129, 155, 156, 159, 166], "outweigh": 156, "over": [5, 9, 13, 17, 138, 140, 150, 153, 155, 156, 158, 161, 163, 167, 169, 173, 174, 178], "overal": 156, "overcom": 175, "overfit": [169, 178], "overflow": 156, "overhaul": 156, "overhead": 129, "overrid": [4, 11, 14, 156, 167], "overview": 177, "overwrit": [16, 18, 19], "overwritten": [15, 155, 156], "own": [11, 15, 148, 156, 158, 160, 161, 163, 167, 168, 169, 170], "p": [138, 148, 151, 152, 153, 154, 155, 175, 178], "p_": [144, 145], "p_0": 148, "pace": 148, "packag": [1, 10, 17, 126, 136, 148, 155, 156, 159, 175], "package_data": 155, "pad": [18, 129, 156], "padding_typ": [18, 156], "page": [16, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 151, 152, 156, 158, 159, 160, 162, 163, 171], "painlessli": 5, "pair": [136, 140, 141, 163], "palett": 177, "pan": 144, "panda": [148, 175, 177], "paper": [131, 142, 148, 156, 161, 162], "paradigm": 2, "parallel": [10, 11, 12, 14, 148, 156, 159, 161, 162, 178], "param": [3, 7, 9, 156, 175], "paramet": [2, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 129, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 155, 156, 158, 159, 160, 163, 165, 167, 173, 177, 178], "parameter": [2, 177, 178], "parameter_tun": 155, "parametr": [5, 177], "parent": [13, 173], "pars": 4, "parse_env_id": 4, "parser": 156, "part": [17, 127, 128, 129, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 150, 151, 152, 153, 154, 155, 156, 159, 166, 169, 175], "parti": [136, 137, 138, 139, 140, 141, 143, 146, 147, 155, 156, 165], "partial": [2, 148, 155, 156, 159], "particular": [5, 6, 9, 10, 20, 129, 156, 158, 162, 166, 169, 175], "particularli": [9, 17, 18, 132, 156, 159], "pass": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 14, 15, 16, 17, 18, 19, 20, 128, 137, 138, 139, 140, 141, 146, 147, 155, 156, 158, 159, 160, 165, 167, 178], "passeng": [154, 173], "passenger_loc": 154, "passidx": 154, "passiv": [17, 20, 155, 156], "passiveenvcheck": [4, 15, 17, 20, 127, 128, 129, 131, 132, 133, 134, 135, 156, 158, 159], "past": [14, 18, 19, 155], "patch": [155, 174], "path": [4, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 153, 156, 159, 161, 165, 173, 178], "pathlib": 173, "patienc": [155, 163], "pattern": [160, 161], "paulmest": 156, "paw": 138, "pcg64": 155, "pd": [175, 177], "pdf": [131, 150, 151, 152], "peg": 155, "pelvi": [140, 141], "penal": [137, 138, 139, 140, 141, 142, 144, 145, 146, 147, 167], "penalis": [133, 134], "penalti": [154, 159], "pend": [11, 155], "pendulum": [11, 12, 18, 130, 131, 132, 136, 155, 158, 177], "pendulumenv": 135, "per": [7, 9, 10, 17, 129, 132, 154, 155, 162, 163, 166, 169, 173, 178], "percentag": [128, 174], "peretz": 156, "perez": 156, "perf_count": 155, "perfect": [158, 159, 163], "perfectli": 165, "perform": [2, 5, 14, 17, 145, 155, 156, 158, 161, 162, 163, 169, 173, 177], "period": 139, "perman": [144, 145], "permiss": [155, 156], "perpendicular": [151, 152, 153, 175], "perpendicularli": 142, "person": 131, "perspect": 148, "perturb": [137, 138, 139, 140, 141, 142, 143, 146, 147], "pet": 158, "pettingzoo": [2, 148, 155], "pge": 148, "phase": [148, 159, 178], "phd": [133, 134, 146], "philosoph": 9, "photorealist": 148, "phys2d": 17, "physic": [2, 126, 136, 142, 143, 144, 145, 148, 155, 156, 159, 177], "pi": [129, 131, 133, 135], "pick": [154, 163, 169, 173, 174, 175, 178], "pickl": [1, 13, 155, 156], "pickled_env_spec": 156, "pickup": [154, 173], "pictur": [158, 161], "piec": 165, "pierrecounath": 156, "pierremardon": 156, "pierr\u00e9": [156, 175], "pinocchio": 148, "pip": [1, 126, 130, 136, 155, 156, 158, 160, 165, 169], "pip3": 155, "pipe": [11, 155], "pipx": 165, "pirata": 155, "pitfal": 127, "pix_square_s": 165, "pixel": [2, 18, 128, 148, 158, 160, 165], "pixelobservationwrapp": [18, 155, 156], "pixelobswrapp": 155, "pixels3d": 165, "pkuderov": 156, "place": [9, 17, 132, 133, 134, 156, 159, 165, 178], "plai": [9, 128, 148, 155, 156, 158, 159, 163, 174], "plan": [148, 155, 156, 159], "plateau": 163, "platform": 148, "playablegam": 9, "player": [148, 150, 151, 152, 153, 154, 163, 174, 175], "player_count": 174, "player_sum": 163, "playfield": 128, "playplot": [9, 156], "pleas": [2, 5, 7, 18, 136, 148, 155, 156, 159, 163, 171], "plot": [1, 9, 161, 163, 173, 174, 175], "plot_nam": 9, "plot_q_values_map": 175, "plot_states_actions_distribut": 175, "plot_steps_and_reward": 175, "plot_surfac": 174, "plotter": 9, "plt": [161, 163, 173, 174, 175, 177, 178], "plu": [7, 151, 152, 156, 161, 163], "plugin": [155, 156], "pm": 129, "png": [169, 173], "point": [4, 8, 9, 15, 127, 128, 129, 131, 132, 135, 136, 145, 150, 155, 156, 159, 166], "pointless": 156, "pole": [2, 130, 136, 142, 143, 148, 158, 177], "pole2": 142, "pole_angl": 158, "pole_angular_veloc": 158, "poli": 148, "polici": [2, 14, 18, 19, 130, 136, 137, 138, 139, 140, 141, 146, 147, 148, 155, 156, 157, 158, 161, 163, 166, 169, 175, 178], "policy_grid": 174, "policy_mean_net": 177, "policy_network": 177, "policy_stddev_net": 177, "polygon": 155, "pomdp": 3, "pong": [17, 156, 160], "pontryagin": 129, "pool": [17, 146], "poorli": 159, "pop": [2, 155, 156], "pop_fram": 17, "popular": [14, 17, 126, 148, 156, 163, 174], "pose": 148, "posit": [2, 6, 7, 8, 9, 11, 13, 17, 127, 128, 129, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 151, 152, 153, 154, 156, 158, 159, 165, 167, 174], "position_fingertip": 145, "position_target": 145, "possibl": [2, 5, 6, 7, 8, 14, 16, 17, 129, 131, 132, 133, 134, 136, 138, 140, 143, 146, 151, 152, 153, 154, 155, 156, 158, 159, 161, 163, 165, 169, 173, 174, 175], "possibli": [7, 13, 15, 17, 159, 178], "post": [155, 156, 160, 175], "postprocess": 175, "potenti": 156, "pow": 178, "power": [17, 128, 129, 134, 142, 143, 148, 177], "pp": 154, "ppo": 171, "pprint": [14, 156], "pprint_registri": [2, 4, 156, 158, 159], "pr": [140, 148, 155, 156], "practic": [148, 155, 158, 160, 163, 166, 173, 174], "practition": 161, "pre": [4, 5, 153, 156, 165], "precis": [6, 155], "predefin": 165, "predict": [139, 148, 163, 177, 178], "predominantli": 3, "prefix": 161, "preload": 153, "premad": 148, "prematur": 2, "prepend": [9, 17], "preprocess": [9, 17, 20, 155, 156], "present": [131, 148, 155, 161, 166, 174], "preserv": [160, 166], "press": [7, 9, 128, 131, 158], "pressur": 159, "pretti": [4, 156, 175], "prevent": [3, 7, 11, 155, 156, 158, 159, 160, 173], "previou": [17, 156, 166, 167], "previous": [4, 9, 18, 137, 138, 139, 140, 141, 143, 146, 147, 155, 156], "primarili": [148, 156], "primaryclass": 156, "principl": 129, "print": [4, 156, 158, 159, 161, 163, 165, 167, 169, 173, 175, 177, 178], "print_registri": 4, "prior": 4, "priori": 148, "privat": 165, "prng": [2, 5, 6, 7], "proabil": [151, 152], "prob": [177, 178], "proba_frozen": 175, "probabl": [5, 6, 7, 16, 20, 151, 152, 153, 154, 156, 160, 163, 166, 174, 175, 177, 178], "problem": [17, 129, 132, 135, 137, 140, 141, 142, 143, 146, 148, 150, 154, 156, 157, 158, 160, 162, 163, 166, 169, 173, 178], "procedur": 177, "proceed": 131, "process": [9, 10, 11, 13, 14, 18, 131, 148, 156, 158, 165, 166, 178], "process_ev": 9, "produc": [2, 17, 20, 155, 156, 165], "product": [6, 7, 177], "program": [10, 11, 12, 148, 156], "progress": [6, 9, 156, 159, 161, 163, 178], "project": [9, 148, 155, 156, 159, 160, 161, 165, 174], "prompt": 156, "propag": 175, "proper": [155, 158], "properli": [1, 5, 155, 158, 159, 160, 169], "properti": [2, 5, 10, 11, 12, 14, 15, 18, 19, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 155, 156, 166], "proport": 178, "propos": [16, 156], "protocol": 17, "prototyp": 148, "prove": 148, "prover": 148, "provid": [2, 5, 6, 7, 9, 10, 11, 14, 16, 17, 18, 20, 126, 127, 131, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 155, 156, 158, 159, 160, 161, 162, 163, 165, 171, 173, 174], "psc": 155, "pseudo": [155, 156, 178], "pseudorandom": [5, 7], "publicli": 156, "publish": 156, "pull": [18, 19, 155], "pump": 165, "pure": 163, "purpos": [3, 5, 155, 160, 161], "push": [129, 132, 136, 142, 143, 148, 156, 158, 177], "pusher": [136, 156], "pusher_v5": 144, "put": [155, 165, 175], "puzzl": 148, "py": [1, 9, 126, 127, 128, 129, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 151, 152, 155, 156, 165, 166, 167, 169, 173, 174, 175, 177, 178], "pybullet": 148, "pycharm": 156, "pydoc": 155, "pyflyt": [148, 156], "pygam": [2, 9, 126, 155, 156, 165], "pyglet": 155, "pypi": [155, 156], "pyplot": [161, 163, 173, 174, 175, 177, 178], "pyproject": 165, "pyright": [2, 155, 156], "pystk2": 148, "python": [1, 17, 126, 127, 128, 129, 148, 155, 156, 157, 158, 159, 160, 165, 166, 167, 169, 170, 171, 173, 174, 175, 177, 178], "pytorch": [14, 17, 20, 156, 162, 171, 177], "q": [154, 161, 166, 170, 171, 173, 176, 178], "q_": 166, "q_tabl": 173, "q_target": 166, "q_updat": 175, "q_valu": [154, 163, 174], "qfrc_actuat": [140, 141], "qfrc_constraint": 142, "qgallouedec": 156, "qlearn": 175, "qpo": [136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147], "qtabl": 175, "qtable_best_act": 175, "qtable_direct": 175, "qtable_directions_map": 175, "qtable_val_max": 175, "quad": 141, "quad_ctrl_cost": 141, "quad_impact_cost": 141, "quadcopt": 148, "quadrotor": 148, "quadrup": [136, 137, 156, 168, 170], "quagla": 155, "qualiti": [10, 148, 156], "quaternion": [137, 140, 141], "queen": 150, "question": [148, 160, 165], "queue": [11, 161], "quicker": 178, "quickli": [133, 148, 163, 174, 175], "quit": [11, 156, 165], "qvel": [136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147], "qwop": 148, "r": [1, 7, 14, 17, 19, 131, 135, 148, 150, 151, 152, 154, 161, 167, 169, 173, 175, 177], "r_": 178, "r_elbow_flex_joint": 144, "r_forearm_roll_joint": 144, "r_shoulder_lift_joint": 144, "r_shoulder_pan_joint": 144, "r_t": 166, "r_upper_arm_roll_joint": 144, "r_wrist_flex_joint": 144, "r_wrist_roll_joint": 144, "race": [126, 148, 155], "racecar": 148, "racecar_gym": 148, "racing_dream": 148, "rad": [131, 132, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147], "radian": [129, 131, 132, 135, 143], "rafaelcp": 156, "raghuspacerajan": 155, "rainbow": [171, 177], "raini": 156, "rais": [2, 4, 7, 8, 9, 11, 12, 13, 15, 17, 18, 132, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 155, 156, 178], "ram": 162, "rand": 155, "randint": [155, 173], "randn": 155, "random": [2, 3, 4, 5, 6, 7, 9, 10, 11, 12, 17, 18, 128, 129, 131, 132, 133, 134, 135, 137, 138, 139, 140, 141, 142, 143, 145, 146, 147, 153, 154, 155, 156, 158, 159, 161, 163, 165, 173, 174, 175, 177], "randomize_domain": 178, "randomize_ob": 128, "randomli": [5, 6, 9, 129, 153, 155, 156, 158, 159, 163, 165, 175, 178], "randomnumbergener": 155, "randomst": 155, "rang": [7, 9, 13, 14, 16, 17, 18, 20, 127, 130, 131, 132, 133, 134, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 150, 151, 152, 153, 154, 155, 156, 157, 158, 159, 160, 161, 163, 165, 167, 169, 170, 172, 173, 174, 175, 176, 177, 178], "rangefind": 127, "raphajan": 156, "rapidli": 148, "rare": [7, 155], "rate": [144, 145, 148, 161, 163, 174, 175, 177, 178], "rather": [2, 4, 6, 128, 155, 156, 161, 174, 178], "raw": [156, 159, 161, 169], "rayerdyn": 156, "rcparam": 177, "rdnfn": 155, "re": [1, 155, 156, 158, 160, 161, 163, 165, 173, 175, 177], "reach": [2, 4, 17, 18, 20, 130, 131, 132, 133, 134, 136, 148, 151, 152, 153, 154, 156, 159, 160, 165, 166, 171, 174, 175, 177], "reachabl": 154, "reacher": [136, 156, 167], "reacher_weighted_reward": 165, "reacherrewardwrapp": 167, "read": [2, 5, 10, 13, 19, 131, 137, 140, 141, 155, 156, 159, 163], "read_from_shared_memori": [5, 13], "readabl": [5, 6, 156, 159], "reader": [162, 169], "readi": [158, 169, 174], "readm": [155, 156, 165], "readthedoc": 18, "real": [9, 138, 148, 158, 173], "realist": [136, 148], "realli": [156, 159, 169, 174], "rear": 128, "reason": [2, 17, 129, 148, 155, 156, 159, 160, 169], "rebuild": 1, "receiv": [9, 18, 19, 20, 128, 129, 134, 147, 154, 155, 157, 158, 163, 166, 174, 177, 178], "recent": [13, 14, 17, 18, 19, 156, 161], "recent_reward": 161, "recogn": 156, "recommend": [3, 4, 9, 11, 17, 129, 136, 137, 140, 141, 155, 156, 159, 169, 174, 178], "reconstruct": 158, "record": [4, 9, 17, 20, 127, 148, 155, 156, 158, 160, 163, 177, 178], "recordconstructorutil": 156, "recorded_fram": 156, "recordepisodestat": 155, "recordepisodestatist": [14, 17, 20, 155, 156, 161, 163, 174, 177, 178], "recordvideo": [17, 20, 155, 156, 161], "recordvideov0": 156, "recreat": 156, "recreated_env": 156, "rect": 165, "red": [154, 155, 165, 173], "redirect": [21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125], "redtachyon": [155, 156], "reduc": [132, 148, 162, 163, 171, 173, 174, 178], "redund": 155, "refactor": [155, 156], "refer": [2, 4, 5, 7, 9, 136, 156, 157, 162, 165, 166, 169], "referenc": 156, "reflect": [18, 132, 155, 156], "refresh": 175, "regard": 130, "regardless": [137, 138, 139, 140, 141, 146, 147, 169], "regex": 4, "reginald": 156, "regist": [13, 155, 156], "register_env": [17, 156, 160], "registr": [4, 155, 156, 165], "registri": [4, 155, 156], "regress": [9, 156], "regularli": 156, "reinforc": [2, 5, 131, 146, 148, 149, 150, 151, 152, 154, 155, 156, 157, 162, 166, 170, 171, 173, 174, 175, 176, 178], "reiniti": [155, 177], "rel": [131, 140, 141, 156, 165, 167, 178], "relat": [129, 132, 137, 139, 140, 141, 142, 143, 144, 145, 147, 148, 156, 177], "relative_posit": 165, "relativeposit": [165, 167], "releas": [10, 11, 12, 131, 132, 133, 134, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 150, 151, 152, 153, 154, 165], "relev": [155, 165], "reli": 136, "reliabl": 163, "relu": [14, 178], "remain": [18, 151, 152, 155, 160, 165, 166], "remak": 178, "rememb": [17, 128, 163, 165, 167], "remind": [156, 169, 173], "remot": [148, 156], "remov": [2, 4, 17, 18, 137, 138, 139, 140, 141, 145, 146, 147, 154, 155, 156], "renam": [14, 17, 18, 138, 140, 155, 156, 177], "render": [2, 3, 4, 10, 14, 15, 17, 18, 20, 126, 127, 137, 138, 139, 140, 146, 147, 148, 155, 156, 158, 161, 167, 174, 175], "render_clos": 3, "render_fp": [2, 9, 17, 156, 165], "render_imag": 3, "render_init": 3, "render_kei": 18, "render_mod": [2, 3, 9, 10, 15, 17, 18, 127, 128, 131, 132, 133, 134, 135, 136, 155, 156, 157, 158, 159, 160, 161, 165, 169, 175, 178], "render_onli": 18, "render_st": 3, "rendercollect": [2, 17, 20, 156], "renderedfram": [17, 20], "renderfram": [2, 9, 10, 14, 15], "renderstatetyp": 3, "renorm": 129, "rep": 175, "repeat": [4, 16, 18, 20, 156, 158, 159, 163, 175], "repeat_action_dur": 16, "repeat_action_prob": 16, "repeatedli": 158, "rephras": 155, "replac": [17, 18, 137, 146, 150, 155, 156, 158, 161, 163, 165, 169, 174], "replay_buff": 156, "repo": [1, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 155, 156], "report": [127, 137, 140, 141, 155, 156, 160], "repositori": [136, 155, 171], "repres": [2, 6, 7, 9, 18, 129, 131, 134, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 151, 152, 153, 154, 155, 156, 157, 158, 159, 165, 169, 175, 177], "represent": [2, 156, 166], "reproduc": [2, 6, 148, 156, 159, 160, 173, 175], "request": [18, 150, 156], "requir": [1, 2, 5, 6, 9, 11, 14, 18, 136, 147, 155, 156, 159, 162, 163, 165, 169, 174, 177, 178], "rerun": 156, "res_al": 175, "rescal": [14, 16, 18, 20, 158], "rescale_act": 155, "rescaleact": [14, 15, 16, 20, 156, 158], "rescaleobserv": [14, 18, 20, 156], "research": [136, 142, 148, 154, 156, 160, 162], "reseed_sampl": 156, "reseed_valu": 156, "reset": [2, 3, 4, 9, 10, 11, 12, 14, 15, 16, 17, 18, 19, 20, 129, 131, 132, 133, 134, 135, 137, 138, 139, 140, 141, 142, 143, 146, 147, 151, 152, 153, 154, 155, 156, 157, 158, 161, 163, 169, 173, 174, 175, 177, 178], "reset_async": 156, "reset_clean": 17, "reset_noise_scal": [137, 138, 139, 140, 141, 142, 143, 146, 147, 169], "reset_qt": 175, "reset_wait": 156, "resetneed": 17, "reshap": [14, 18, 20, 175], "reshape_env": 18, "reshapeobserv": [14, 18, 20], "resiz": [14, 17, 18, 20, 156], "resized_env": 18, "resizeobserv": [14, 18, 20, 156], "resolv": 155, "resourc": [10, 11, 12, 159, 160, 165, 174], "respect": [14, 15, 17, 129, 131, 137, 138, 139, 140, 141, 146, 147, 155, 156, 158, 167, 178], "respectivesli": 14, "respond": [158, 174], "rest": [128, 129, 139, 147, 156, 159, 178], "restart": 158, "restor": [137, 138, 139, 140, 141, 146, 147, 163], "restrict": 156, "result": [2, 6, 8, 11, 12, 13, 17, 129, 131, 132, 136, 137, 140, 141, 142, 145, 149, 151, 152, 154, 155, 156, 158, 159, 160, 161, 174, 175, 178], "retriev": 4, "retro": [148, 156], "return": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 127, 136, 137, 138, 139, 140, 141, 145, 146, 147, 150, 151, 152, 153, 154, 155, 156, 158, 159, 160, 163, 165, 166, 167, 173, 174, 175, 177, 178], "return_info": [2, 155], "return_queu": [14, 17, 161, 163, 174, 177, 178], "reveal": [150, 161], "revers": [5, 8, 150, 177, 178], "revert": [155, 156], "revisit": 17, "rew": [9, 14, 17, 19, 166], "reward": [2, 3, 4, 9, 10, 11, 12, 15, 17, 18, 20, 148, 155, 156, 157, 158, 160, 161, 163, 165, 166, 167, 173, 174, 175, 177, 178], "reward_al": 140, "reward_control": [144, 145], "reward_control_weight": [144, 145], "reward_ctrl": [14, 137, 139, 140, 144, 145, 147, 167], "reward_ctrl_weight": 167, "reward_dist": [144, 145, 167], "reward_dist_weight": [144, 145, 167], "reward_forward": [137, 138, 139, 140, 146, 147], "reward_fwd": 146, "reward_linvel": 140, "reward_moving_averag": [163, 174], "reward_near": 144, "reward_near_weight": [144, 145], "reward_over_episod": 177, "reward_quadctrl": 140, "reward_rang": 156, "reward_run": [14, 138], "reward_scal": 159, "reward_surv": [137, 139, 140, 142, 143, 147], "reward_threshold": [4, 137, 138, 139, 140, 141, 144, 145, 146, 147, 156, 165], "rewards_df": 175, "rewards_over_se": 177, "rewardtyp": [3, 156], "rewardwrapp": [14, 15, 19, 169], "rewrit": [155, 156], "rgb": [2, 14, 17, 18, 20, 128, 137, 138, 139, 140, 146, 147, 155, 156, 158], "rgb_arrai": [2, 3, 9, 17, 18, 20, 127, 128, 131, 132, 133, 134, 135, 136, 155, 156, 158, 160, 161, 165, 169, 175, 178], "rgb_array_list": [2, 9, 17, 155], "rgbd": 156, "rgbd_tupl": 136, "richard": 175, "ride": [158, 163], "right": [2, 7, 127, 128, 129, 132, 133, 134, 135, 137, 138, 139, 140, 141, 142, 143, 146, 147, 151, 152, 153, 154, 156, 158, 159, 163, 165, 173, 174, 175, 177], "right_back_leg": 137, "right_elbow": [140, 141], "right_foot": [140, 141], "right_hip_i": [140, 141], "right_hip_x": [140, 141], "right_hip_z": [140, 141], "right_kne": [140, 141], "right_lower_arm": [140, 141], "right_shoulder1": [140, 141], "right_shoulder2": [140, 141], "right_sin": [140, 141], "right_thigh": [140, 141], "right_upper_arm": [140, 141], "rigid": [140, 141], "risk": 148, "riski": 148, "rl": [9, 17, 148, 156, 157, 159, 160, 161, 163, 166, 169, 170, 172, 174, 176, 177], "rlbook2020": [150, 151, 152], "rmsprop": 178, "rnd": [155, 156], "rng": [2, 3, 5, 6, 7, 9, 10, 155, 156, 165, 175], "road": [128, 156], "roadmap": 156, "robertoschiavon": 156, "robo": 148, "robot": [127, 133, 134, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 155, 156, 158, 160, 166, 168, 170], "robust": [148, 173, 178], "rocket": [129, 148], "rodrigo": 156, "rodrigodelazcano": [155, 156], "rogerjl": 156, "rohan138": 155, "roll": [18, 20, 144, 174], "rolling_length": [163, 174, 178], "rollout": [154, 156], "rom": [155, 156], "ronald": 177, "root": [6, 137, 140, 141, 156], "rooti": [138, 139, 147], "rootx": [138, 139, 147], "rootz": [138, 139, 147], "rotat": [129, 131, 137, 140, 141, 144, 155, 174], "rotor": [137, 138, 139, 140, 141, 146, 147], "roughli": 136, "roulett": 155, "roundtrip": 17, "row": [151, 152, 153, 159, 163, 175], "rpg": 153, "rr": 156, "rstride": 174, "rule": [148, 150, 159, 163, 174], "run": [1, 2, 4, 10, 11, 12, 14, 17, 18, 19, 127, 129, 131, 136, 137, 138, 139, 140, 146, 147, 148, 151, 152, 155, 156, 158, 160, 161, 162, 165, 169, 178], "run_": 1, "run_env": 175, "run_gymnasium_env": 165, "runner": 136, "running_g": 177, "runningmeanstd": [14, 18, 19], "runtim": 178, "runtimeerror": [11, 12, 178], "rushivarora": 155, "rusu24edward": [155, 156], "ryanrud": 155, "r\u00e9mi": 146, "s_": 178, "sab": [150, 163, 174], "safe": [129, 148, 156, 158], "safeti": [148, 155, 156, 159], "sai": [17, 155, 163, 167], "said": [3, 140], "same": [4, 5, 6, 8, 9, 10, 11, 12, 13, 14, 16, 18, 20, 127, 128, 131, 136, 137, 138, 139, 140, 141, 142, 144, 145, 146, 147, 154, 155, 156, 159, 160, 162, 163, 166, 169, 174, 178], "sampl": [2, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 17, 18, 19, 129, 144, 154, 155, 156, 157, 158, 160, 161, 162, 163, 165, 169, 174, 175, 177, 178], "sample_act": 177, "sample_mask": 6, "sample_n": 5, "sample_phas": 178, "samplefactori": 156, "sander": 156, "saniti": 175, "sarsa": 163, "sashashura": [155, 156], "satisfi": 2, "satur": 148, "save": [14, 17, 155, 156, 158, 161, 163, 167, 173, 175], "save_logg": 9, "save_video": [9, 155], "save_videos1": 17, "save_videos2": 17, "save_videos3": 17, "save_weight": 178, "savefig": 173, "savefig_fold": 173, "sb3": 155, "scalabl": 148, "scalar": [7, 14, 16, 155], "scale": [14, 17, 18, 19, 129, 137, 138, 139, 140, 141, 142, 143, 146, 147, 148, 156, 162, 178], "scale_and_shift": 14, "scale_ob": 17, "scenario": [128, 148, 161, 173], "scene": [2, 148, 156, 169], "sched": 148, "schedul": [9, 148, 153], "scheme": 128, "schulhoff": 156, "schulman": [137, 178], "scienc": 163, "scope": [2, 166], "score": [127, 129, 158, 159], "scoreboard": 155, "scratch": [177, 178], "screen": [17, 137, 138, 139, 140, 146, 147, 155, 156, 158], "screen_siz": 17, "script": [1, 148, 161, 174], "sdl": 156, "seaborn": [174, 175, 177], "search": 156, "sebastian": 156, "second": [1, 6, 9, 10, 17, 129, 132, 142, 145, 146, 148, 156, 161, 162, 169], "section": [16, 128, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 156, 160, 165, 174, 175], "see": [1, 2, 5, 6, 9, 10, 11, 12, 17, 128, 129, 131, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 151, 152, 153, 155, 156, 158, 159, 160, 161, 163, 165, 169, 175, 178], "seed": [2, 3, 4, 5, 6, 7, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 131, 132, 133, 134, 135, 136, 155, 156, 157, 158, 159, 161, 165, 173, 175, 177, 178], "seeded_valu": 156, "seem": [158, 175], "seen": [131, 159], "segment": 146, "select": [5, 7, 9, 136, 156, 158, 169, 173, 178], "select_act": 178, "self": [5, 6, 7, 9, 14, 18, 19, 134, 148, 156, 159, 163, 165, 167, 174, 175, 177, 178], "semant": 155, "send": 14, "sens": [7, 159, 169, 175], "sensor": [128, 169], "sent": 155, "separ": [5, 17, 156, 159, 160, 165, 178], "sepsi": 148, "sequenc": [2, 4, 5, 6, 7, 8, 11, 12, 13, 14, 18, 148, 155, 156, 158, 159], "sequenti": [161, 177, 178], "seri": [6, 158], "serial": [12, 178], "serv": [3, 5, 137, 138, 139, 140, 141, 146, 147, 161], "server": 156, "set": [2, 4, 5, 6, 7, 9, 10, 11, 12, 15, 16, 17, 18, 20, 126, 129, 130, 131, 133, 134, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 153, 155, 156, 159, 160, 161, 165, 166, 167, 169, 171, 173, 174, 175, 177, 178], "set_attr": [11, 12, 156], "set_color": 175, "set_linewidth": 175, "set_mod": 165, "set_np_random_through_se": [2, 10], "set_rotate_label": 174, "set_stat": 155, "set_them": 175, "set_titl": [163, 174, 175, 178], "set_vis": 175, "set_wrapper_attr": [15, 156], "set_xlabel": [163, 174, 178], "set_xtick": 175, "set_xticklabel": 174, "set_ylabel": [163, 174], "set_yticklabel": 174, "set_zlabel": 174, "setup": [155, 161, 173], "seungjaeryanle": 155, "seven": 147, "sever": [2, 4, 7, 10, 17, 129, 155, 156, 158, 159, 161, 173, 175], "sfff": 153, "sfffffff": 153, "shape": [2, 5, 6, 7, 8, 10, 11, 13, 14, 16, 17, 18, 20, 131, 132, 133, 134, 135, 137, 140, 141, 150, 151, 152, 153, 154, 155, 156, 158, 159, 165, 167, 175, 177, 178], "share": [5, 11, 156, 161, 177], "shared_featur": 177, "shared_memori": [11, 13], "shared_net": 177, "sheet": 163, "shen": 156, "shift": 7, "shimmi": [156, 160], "shin": [138, 140, 141], "shinrl": 148, "shoot": 11, "short": [136, 155, 160, 163], "shorthand": 155, "should": [1, 2, 5, 7, 9, 10, 11, 12, 13, 14, 17, 136, 145, 155, 156, 158, 159, 162, 163, 165, 166, 167, 169, 174, 178], "shoulder": 144, "shouldn": [156, 159, 165], "show": [3, 136, 150, 155, 156, 158, 160, 161, 163, 165, 167, 169, 170, 172, 173, 174, 175, 176, 177, 178], "showcas": [164, 168, 170, 174], "shown": [128, 131, 166], "shrink_act": 14, "siddarth": [156, 177], "side": [13, 129, 175], "sign": [142, 143, 177], "signal": [2, 17, 137, 139, 140, 147, 154, 158, 165, 166, 175], "signific": [148, 156, 160, 161, 169], "significantli": [155, 156, 173, 178], "silenc": 9, "silent": 156, "silver": [175, 178], "sim": [148, 175], "similar": [6, 10, 144, 155, 156, 159, 165], "similarli": [129, 156], "simlat": 136, "simonini": 175, "simoninithoma": 175, "simpl": [127, 148, 149, 157, 158, 160, 161, 163, 166, 177], "simplegrid": 148, "simpler": 158, "simplest": 178, "simpli": [14, 16, 17, 18, 19, 165], "simplic": 148, "simplifi": [135, 155, 156], "simplist": 165, "simul": [2, 136, 140, 141, 142, 143, 148, 156, 159, 174, 175, 177], "simultan": [156, 159], "sin": [129, 135, 142, 145], "sinc": [5, 14, 17, 126, 132, 141, 145, 154, 155, 156, 159, 165, 166, 169, 175], "sine": [131, 142, 145], "singl": [2, 3, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 18, 20, 139, 147, 148, 155, 156, 158, 159, 160, 162, 165, 174, 177], "single_action_spac": [10, 13, 14, 156, 178], "single_func": 14, "single_observation_spac": [10, 11, 14, 156, 178], "single_rgb_arrai": 155, "sinusoid": [133, 134], "site": 155, "situat": [154, 158, 163], "six": 147, "size": [5, 13, 14, 17, 148, 153, 155, 156, 159, 165, 169], "sjmikler": 156, "skeleton": 165, "skill": [159, 161], "skip": [9, 17, 18, 20, 155, 156, 160, 165], "skip_and_max_ob": 18, "skip_close_check": 9, "skip_render_check": 9, "sleep": 129, "slide": [138, 139, 142, 143, 144, 145, 146, 147], "slider": [142, 143], "slider1": 146, "slider2": 146, "slight": 127, "slightli": [9, 127, 136, 137, 140, 141, 142, 145, 163], "slime": 148, "slimevolleygym": 148, "slipperi": [151, 153], "slow": [156, 174], "slowdown": 9, "slower": [129, 163, 178], "small": [127, 148, 149, 155, 156, 159, 163, 177], "smallest": 7, "smart": 148, "smarter": 158, "smooth": [161, 163], "smoother": [155, 174], "sn": [174, 175, 177], "snake_cas": 1, "snippet": [9, 17], "snow": 153, "so": [1, 9, 11, 14, 17, 18, 20, 129, 130, 137, 138, 139, 140, 141, 144, 145, 146, 147, 151, 152, 153, 155, 156, 159, 161, 163, 165, 166, 167, 169, 174, 175, 178], "soft": 148, "softmax": 178, "softrobot": 148, "softwar": [2, 148, 156], "sokoban": 148, "sole": [155, 156], "solut": [129, 156, 174], "solv": [2, 127, 130, 132, 136, 142, 143, 148, 159, 160, 163, 165, 170, 176, 177], "some": [2, 5, 6, 7, 10, 11, 12, 14, 15, 128, 130, 131, 145, 146, 154, 155, 156, 158, 160, 161, 163, 165, 167, 169, 174, 175, 178], "someth": [155, 156, 169], "sometim": [9, 137, 151, 152, 153, 158, 159, 161, 165, 167], "sonelu": 156, "soon": [155, 165], "sophist": [159, 161], "sort": 7, "sourc": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 136, 148, 154, 155, 156, 165, 166, 167, 169, 170, 173, 174, 175, 177, 178], "south": [154, 173], "space": [2, 9, 10, 11, 12, 14, 15, 16, 17, 18, 20, 136, 148, 149, 155, 156, 163, 165, 167, 175, 177, 178], "spacecraft": 148, "spaces_kwarg": 6, "span": 17, "sparisi": 156, "spark": 148, "spars": [131, 159, 165], "spatial": 159, "spawn": [11, 145, 178], "spec": [2, 3, 4, 10, 15, 17, 156], "special": [156, 177], "specialis": 156, "specialist": 162, "specif": [2, 4, 7, 10, 14, 17, 136, 155, 156, 159, 161, 166, 177, 178], "specifi": [2, 5, 6, 7, 9, 14, 16, 17, 18, 20, 126, 127, 128, 129, 130, 135, 137, 138, 139, 140, 141, 143, 146, 147, 149, 153, 154, 155, 156, 158, 160, 161, 165, 167], "speed": [10, 127, 128, 156, 158, 160, 169, 170, 176], "speedup": 178, "spell": 155, "spent": [127, 129], "sphere": 144, "spheric": 145, "sphinx": 1, "spike": 163, "spine": 175, "spinningup": 177, "split": [147, 156], "squar": [17, 144, 145, 154, 156, 159, 165, 175, 178], "squeez": [177, 178], "st": 175, "st_all": 175, "stabil": [14, 18, 19, 140, 141, 155, 159, 163, 167, 177], "stabl": [18, 148, 155, 156, 163, 165, 171, 173], "stable_baselines3": 18, "stack": [6, 17, 18, 20, 156, 177], "stack_siz": 18, "stacked_env": 18, "stage": [17, 156, 161], "stai": [158, 159, 163, 178], "stand": [127, 136, 137, 139, 140, 141, 142, 143, 147, 156, 163, 174], "standard": [18, 19, 148, 155, 156, 157, 163, 173, 177, 178], "standard_norm": 155, "standup": 136, "stare": 161, "start": [1, 2, 5, 7, 9, 11, 13, 17, 136, 156, 157, 158, 160, 161, 163, 174, 175, 177, 178], "start_epsilon": [163, 174], "state": [2, 3, 4, 17, 18, 20, 130, 136, 148, 149, 155, 156, 158, 160, 163, 166, 169, 173, 174, 175, 177, 178], "state_dict": 178, "state_info": 3, "state_s": 175, "state_valu": [174, 178], "state_value_pr": 178, "statefulli": 3, "stateless": [3, 156], "statement": [156, 160], "statetyp": [3, 156], "stationari": 178, "statist": [9, 14, 17, 18, 19, 129, 156, 161, 173, 177], "stats_kei": [14, 17], "std": [14, 161, 163, 173, 177], "std_reward": [161, 173], "stderr": 155, "steer": [128, 159], "stefanbschneid": 156, "step": [2, 3, 4, 10, 11, 12, 14, 15, 16, 17, 18, 19, 20, 127, 129, 131, 132, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 151, 152, 153, 154, 155, 156, 157, 161, 162, 166, 167, 173, 174, 175, 177, 178], "step_api_compat": 9, "step_async": 156, "step_count": 161, "step_index": 9, "step_info": 3, "step_penalti": 159, "step_return": 9, "step_starting_index": 9, "step_trigg": [9, 17], "step_wait": 156, "stepapicompat": 156, "steppabl": 148, "steps_df": 175, "stick": [150, 174], "sticki": 16, "stickyact": [16, 20, 156], "still": [9, 155, 156, 163, 167, 173, 174, 178], "stochast": [16, 130, 131, 133, 134, 136, 151, 152, 155, 175], "stock": 148, "stool": 153, "stop": [17, 150, 156, 158, 163, 166, 174], "stopiter": 13, "storag": 148, "store": [4, 9, 14, 17, 156, 173, 177], "str": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 17, 18, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 156, 174, 175, 177], "straightforward": 160, "strang": 156, "strateg": [133, 134, 159], "strategi": [148, 158, 159, 160, 162, 174], "strict": [2, 155, 156], "strictli": 17, "striker": 155, "string": [2, 4, 5, 7, 9, 14, 18, 155, 156, 158, 159, 165], "stringio": 2, "stronger": 169, "structur": [3, 5, 6, 8, 156, 158, 159, 165], "struggl": 161, "stump": 127, "style": [2, 4, 10, 148, 155, 156, 160, 177], "sub": [6, 10, 11, 12, 14, 156, 162], "subclass": [14, 155], "subject": 146, "submit": [148, 155], "suboptim": 163, "subplot": [163, 174, 175, 178], "subprocess": 11, "subse": 155, "subsect": 169, "subsequ": [6, 155, 160], "subset": [7, 156, 167], "subspac": [5, 6, 7, 8, 14, 18, 155], "substanti": [156, 162], "subtl": 160, "subtract": 178, "succeed": 158, "success": [131, 154, 156, 158, 159, 160, 161, 166], "successfulli": [2, 154, 158, 163, 169], "suffici": [159, 174], "suggest": [155, 163, 178], "suit": [148, 155], "suitabl": [148, 149], "sum": [6, 7, 17, 129, 150, 156, 161, 174, 175, 177], "summaris": 156, "sumo": 148, "super": [2, 14, 15, 148, 155, 159, 165, 167, 177, 178], "superclass": [5, 16, 19], "supersuit": 156, "supertuxkart": 148, "supervis": 163, "suppli": 166, "support": [2, 5, 6, 8, 9, 10, 17, 18, 20, 137, 138, 139, 140, 141, 143, 146, 147, 148, 155, 156, 158, 159, 165], "supportsfloat": [2, 7, 9, 15, 19, 167, 177], "suppos": 9, "suptitl": [174, 178], "sure": [1, 2, 9, 17, 165, 167, 169], "surfac": [142, 143, 147, 165], "surfarrai": 165, "surround": [17, 20], "survei": 162, "suspend": 146, "sutton": [2, 131, 132, 142, 143, 150, 151, 152, 155, 174, 175], "sutton_barto_reward": [132, 156], "swig": [126, 155, 156], "swim": 136, "swimmer": [136, 147, 155], "swing": [131, 135], "swingup": 135, "switch": [155, 156, 158, 160], "symbol": 148, "symptom": 163, "sync": [4, 9, 10, 12, 14, 132, 156], "synchron": [10, 11, 12, 156], "synchronizedarrai": 13, "syncvectorenv": [4, 10, 132, 156, 159, 162, 178], "syntax": 4, "synthes": 148, "synthesi": [140, 141], "system": [131, 135, 136, 142, 155, 156, 159, 165], "system_check": 6, "systemat": [161, 163], "t": [1, 2, 4, 5, 6, 8, 9, 14, 15, 17, 128, 129, 133, 134, 154, 155, 156, 158, 159, 160, 161, 163, 165, 166, 173, 174, 175, 178], "t_cov": [5, 13], "tabl": [155, 163, 173], "tabular": [148, 163, 170, 176], "tag": 148, "tai": 156, "tailkind": 9, "take": [1, 2, 3, 4, 7, 8, 9, 10, 11, 16, 17, 130, 132, 134, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 154, 155, 158, 159, 163, 167, 173, 174, 175, 177, 178], "taken": [10, 17, 18, 20, 130, 132, 158, 161, 162, 165, 171, 177, 178], "talk": [162, 163, 177], "tall": 137, "tan": 156, "tanh": [129, 177], "target": [18, 131, 136, 144, 145, 154, 159, 160, 163, 165, 166, 167, 178], "target_devic": [14, 17], "target_dur": 9, "target_i": [145, 159], "target_posit": 167, "target_x": [145, 159], "target_xp": [14, 17], "task": [2, 6, 15, 128, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 158, 159, 160, 165, 166, 167, 175, 177], "tassa": [139, 140, 141], "tau": 135, "taxi": [149, 155, 156, 170, 176], "taxi_col": 154, "taxi_row": 154, "taxi_v3_action_masking_comparison": 173, "td": [175, 178], "td3": 171, "td_error": 178, "teach": [158, 163], "team": [155, 156], "technic": [16, 156], "techniqu": [17, 20, 161, 173], "techreport": [133, 134], "tell": [158, 163, 166, 171, 174], "templat": [3, 165], "tempor": 163, "temporal_differ": [163, 174], "temporarili": [13, 163], "ten": [150, 174], "tendon": [140, 141], "tendon_length": [140, 141], "tendon_veloc": [140, 141], "tensor": [14, 17, 20, 177, 178], "term": [2, 14, 18, 130, 131, 136, 137, 138, 139, 140, 141, 142, 144, 145, 146, 147, 159, 163, 165, 167, 178], "termin": [2, 3, 9, 10, 11, 12, 14, 17, 18, 19, 20, 131, 132, 133, 134, 150, 151, 152, 153, 154, 155, 156, 157, 158, 159, 161, 163, 165, 167, 174, 175, 177, 178], "terminal_observ": 155, "terminal_on_life_loss": 17, "terminaltyp": [3, 156], "terminate_when_unhealthi": [137, 139, 140, 147, 169], "terminationwrapp": 169, "terrain": [127, 148, 169], "terri": 156, "terribli": 155, "test": [9, 17, 127, 148, 155, 156, 158, 161, 165, 169, 177], "test_ag": 163, "tetri": 148, "text": [2, 5, 7, 8, 13, 150, 151, 152, 153, 154, 155, 156, 158], "textencod": 155, "th": [17, 18, 20], "than": [1, 4, 6, 16, 129, 131, 132, 133, 134, 143, 144, 150, 155, 156, 158, 159, 161, 163, 169, 174, 175, 178], "thank": 156, "theden": 155, "thei": [5, 11, 17, 20, 136, 149, 150, 151, 152, 153, 155, 156, 159, 160, 162, 165, 169, 173, 178], "theirfor": 178, "them": [3, 5, 14, 15, 17, 129, 137, 138, 145, 148, 154, 155, 156, 160, 167, 169, 173, 178], "themselv": 148, "theo": 156, "theorem": 148, "theoret": [148, 155, 156, 163], "theori": [135, 142, 155, 158, 175, 178], "therefor": [2, 5, 17, 137, 140, 141, 145, 147, 155, 156, 170, 172, 176], "thesi": [133, 134, 146], "theta": [135, 155], "theta1": 131, "theta2": 131, "theta_dt": 135, "thi": [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 126, 127, 128, 129, 130, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 150, 151, 152, 153, 154, 155, 156, 157, 158, 159, 161, 162, 163, 165, 166, 167, 169, 171, 173, 174, 175, 177, 178], "thigh": [138, 139, 140, 141, 147], "thigh_joint": [139, 147], "thigh_left_joint": 147, "thing": [13, 15, 155, 163, 167], "think": [13, 148, 158], "third": [137, 138, 139, 140, 141, 143, 146, 147, 155, 156, 165], "third_party_environ": 155, "thoma": 175, "thoroughli": 159, "those": [13, 14, 131, 155, 159, 167, 175, 178], "though": [6, 11, 155], "thought": [155, 156, 163], "thousand": [156, 161], "thousandth": 17, "thread": 156, "three": [5, 6, 15, 139, 140, 141, 146, 155, 156, 159, 165], "threshold": [4, 131, 132, 154, 165], "throttl": [129, 159], "through": [2, 3, 4, 5, 10, 11, 12, 14, 17, 18, 20, 140, 141, 148, 155, 156, 157, 158, 159, 162, 163, 166, 173], "throw": [156, 167], "thrower": 155, "thrown": 7, "thruster": 129, "thu": [11, 137, 140, 141, 142, 156, 178], "thytu": 156, "ti": 175, "tick": 165, "tight": 173, "tight_layout": [163, 174, 175, 178], "tile": [128, 153, 175], "tileset": 153, "till": [174, 178], "till2": 156, "tilleri": 153, "tilt": 129, "tim": 175, "time": [1, 2, 5, 6, 9, 10, 14, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 127, 128, 132, 135, 137, 138, 139, 140, 141, 142, 144, 145, 146, 147, 148, 151, 152, 154, 155, 156, 158, 159, 160, 161, 162, 163, 165, 168, 169, 170, 171, 173, 174, 177, 178], "time_limit": [153, 154], "time_queu": [14, 17, 161], "timeawareobserv": [10, 18, 20, 156, 158], "timelaps": 161, "timelimit": [2, 4, 15, 17, 20, 127, 128, 129, 131, 132, 133, 134, 135, 156, 158, 165, 166], "times10": [137, 140, 141], "timestamp": 2, "timestep": [2, 17, 18, 20, 133, 134, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 158, 159, 165, 169, 177, 178], "timgates42": 155, "timschneider42": 156, "tip": [138, 142, 146, 147], "tips_arm": 144, "titl": [9, 133, 134, 156, 161, 173, 174, 175, 177], "tmrl": 148, "to_json": [5, 156], "to_torch": 156, "tobirohr": 156, "toctre": 1, "todorov": [139, 140, 141], "togeth": [5, 12, 136, 160, 175], "toi": [126, 150, 151, 152, 153, 154, 155], "tom": 154, "toml": 165, "ton": 155, "too": [137, 138, 139, 140, 141, 142, 144, 145, 146, 147, 158, 159, 169, 175], "took": 161, "tool": [137, 138, 139, 140, 141, 143, 146, 147, 148, 158, 161], "toolbox": 148, "toolkit": 148, "top": [128, 129, 130, 133, 134, 139, 142, 143, 147, 148, 155, 156, 159, 165, 175, 177], "torch": [2, 14, 17, 20, 156, 177, 178], "torqu": [127, 129, 131, 135, 137, 138, 139, 140, 141, 144, 145, 146, 147], "torso": [137, 138, 139, 140, 141, 147, 169], "toss": 7, "total": [2, 127, 128, 129, 137, 138, 139, 140, 141, 142, 144, 145, 146, 147, 154, 158, 161, 163, 173, 175, 177, 178], "total_episod": 175, "total_num_episod": 177, "total_reward": [158, 163, 173, 175], "total_timestep": 156, "touch": [14, 159, 165], "touretzki": 131, "toward": [146, 155, 163], "tower": 156, "towers2024gymnasium": 156, "towers_gymnasium_2023": 156, "town": 156, "toy_text": [153, 155, 174, 175], "tpu": 162, "tqdm": [163, 174, 175, 178], "trace": [127, 156], "traceback": [13, 17], "track": [9, 14, 17, 20, 128, 132, 137, 138, 139, 140, 146, 147, 148, 156, 163, 173], "trackmania": 148, "trade": [148, 156, 158, 159], "tradeoff": 178, "traffic": 148, "train": [10, 137, 140, 141, 142, 145, 148, 155, 156, 158, 159, 160, 171, 173, 175], "train_q_learn": 173, "training_env": 160, "training_error": [163, 174], "training_error_moving_averag": [163, 174], "training_period": 161, "training_video": 161, "trajectori": [14, 18, 19, 129, 140, 141], "transfer": [14, 17, 148, 162], "transform": [3, 5, 8, 9, 14, 15, 16, 18, 19, 20, 145, 167], "transformact": [14, 16, 20], "transformob": 156, "transformobserv": [14, 18, 20], "transformreward": [14, 19, 20], "transit": [3, 9, 140, 141, 151, 152, 153, 154, 156, 157, 166, 178], "transition_info": 3, "translat": [137, 140, 141, 156, 159, 165], "transport": 148, "transpos": [9, 165], "treasur": 175, "treat": 158, "treatment": 148, "tremend": 155, "trend": 161, "tri": 156, "trial": [158, 163], "trigaten": 155, "trigger": [9, 17, 154, 161], "tristan": 156, "tristandeleu": 155, "trivial": [158, 159, 165], "true": [2, 4, 6, 8, 9, 10, 11, 12, 14, 15, 16, 17, 18, 19, 127, 128, 132, 136, 137, 138, 139, 140, 141, 146, 147, 150, 153, 154, 155, 156, 158, 161, 163, 165, 169, 173, 174, 175, 177, 178], "true_": [16, 18], "trunc": [14, 18], "truncat": [2, 4, 9, 10, 11, 12, 14, 17, 18, 19, 20, 128, 131, 132, 133, 134, 153, 154, 155, 156, 157, 158, 159, 161, 163, 165, 167, 169, 173, 174, 175, 177, 178], "trunk": 169, "try": [141, 148, 155, 156, 158, 159, 163, 174], "tuckerbmorgan": 155, "tune": [148, 177], "tupl": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 20, 137, 139, 140, 147, 150, 155, 156, 158, 159, 160, 163, 165, 174, 177, 178], "turbotimon": 156, "turbul": [129, 155], "turbulence_pow": [129, 178], "turn": [9, 11, 17, 128, 129, 142, 148, 155, 156], "tutori": [2, 15, 156, 159, 160, 161, 163, 164, 165, 166, 167, 168, 169, 172, 173, 174, 175, 176, 177, 178], "tutorials_jupyt": 170, "tutorials_python": 170, "tweak": [136, 146], "two": [2, 5, 6, 7, 9, 10, 17, 18, 20, 127, 129, 131, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 145, 146, 147, 148, 150, 155, 156, 159, 161, 162, 165, 174, 178], "txt": [1, 155], "type": [2, 4, 5, 6, 7, 10, 14, 16, 17, 18, 20, 128, 132, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 155, 156, 159, 160, 165, 167, 175, 177], "typeerror": 156, "typic": [2, 9, 154, 159, 161, 169, 173], "typo": [155, 156], "u": [5, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 155, 156, 159, 163, 165, 167, 174, 177], "uav": 148, "uint8": [18, 128], "un": 132, "unattach": [144, 145], "unbound": [7, 18], "uncertain": 148, "uncertainti": 148, "unclear": [156, 159], "uncom": 169, "uncommon": 156, "undefin": 2, "under": [2, 156, 174, 177], "underli": [2, 15, 17, 131, 156, 158], "underneath": [15, 132, 158], "underpow": 130, "underscor": [155, 160], "understand": [2, 8, 10, 144, 156, 159, 160], "undocu": 156, "uneven": 127, "unexpect": [11, 129, 155], "unflatten": [5, 8, 156], "unhealthi": [137, 139, 140, 142, 143, 147], "unicod": 9, "uniform": [5, 7, 8, 133, 134, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 175], "uniformli": [7, 131, 132, 154, 165], "uniniti": 159, "unintend": 156, "union": [6, 7, 19, 156], "uniqu": [6, 10, 126, 130, 136, 142, 155, 160], "unit": [5, 14, 18, 20, 129, 131, 133, 134, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148], "uniti": 148, "unitless": [142, 145], "unitre": 169, "unitree_go1": 169, "univers": [133, 134, 175], "unknown": [2, 9, 10, 148, 158], "unless": [7, 15, 150, 151, 152, 153, 154, 155, 165], "unlik": [6, 163, 177], "unmaintain": 156, "unmasked_mean_curv": 173, "unmasked_mean_reward": 173, "unmasked_overall_mean": 173, "unmasked_overall_std": 173, "unmasked_result": 173, "unmasked_results_list": 173, "unnecessari": [155, 156], "unnecessarili": 160, "unnescesari": 155, "unord": 5, "unpack": 160, "unpickl": [9, 13, 155, 156], "unplay": 9, "unreli": 160, "unsupport": 7, "untermin": 132, "until": [17, 144, 150, 151, 152, 153, 155, 156, 158, 163, 165, 175, 177, 178], "unus": [155, 159], "unusu": 161, "unwrap": [2, 10, 15, 131, 156, 158, 159], "up": [2, 6, 7, 10, 127, 129, 136, 137, 139, 140, 141, 147, 150, 151, 152, 153, 154, 156, 158, 159, 161, 163, 165, 169, 170, 173, 174, 175, 176], "updat": [1, 2, 3, 9, 14, 16, 17, 18, 19, 137, 139, 140, 147, 154, 155, 156, 158, 159, 160, 165, 166, 167, 173, 174, 175, 177, 178], "update_paramet": 178, "update_running_mean": [18, 19], "upfront": 160, "upgrad": [155, 156], "uph": 141, "uph_cost": 141, "uph_cost_weight": 141, "upload": 161, "upon": [133, 134, 160], "upper": [7, 14, 19, 20, 140, 141, 155, 158], "upright": [132, 135, 142, 143, 158], "upsid": 156, "upstream": 156, "urandom": 2, "urban": 148, "urdf": 169, "url": [155, 156, 178], "urldat": 156, "us": [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 17, 18, 19, 20, 126, 127, 129, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 153, 154, 155, 156, 158, 160, 161, 162, 163, 166, 167, 169, 170, 173, 174, 176], "usabl": [150, 155, 163, 174], "usable_ac": [163, 174], "usag": [9, 156, 159, 160, 161, 163, 167], "use_action_mask": 173, "use_contact_forc": [137, 156], "use_cuda": 178, "useless": 169, "user": [2, 3, 4, 5, 9, 10, 12, 14, 18, 20, 131, 132, 133, 134, 135, 155, 156, 158, 160, 164, 165, 168, 170, 177], "usual": [2, 6, 7, 17, 139, 158, 163, 165, 167, 169, 174, 178], "util": [18, 148, 155, 156, 158, 159, 165, 178], "utilis": [10, 155], "utli": 156, "v": [4, 133, 134, 160, 173, 178], "v0": [2, 4, 9, 10, 14, 16, 17, 18, 19, 127, 128, 129, 131, 132, 133, 134, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 150, 151, 152, 153, 154, 159, 165, 166, 171, 177], "v1": [2, 4, 9, 10, 11, 12, 14, 16, 17, 18, 19, 127, 128, 129, 131, 132, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 150, 151, 152, 153, 154, 155, 158, 161, 163, 171, 174, 175], "v2": [127, 128, 129, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 154, 155, 156], "v21": [155, 156, 160], "v24": 155, "v25": 155, "v26": [2, 156, 160, 177], "v28": 156, "v2g": 148, "v3": [9, 14, 17, 18, 127, 128, 129, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 154, 155, 156, 157, 158, 160, 167, 173, 178], "v4": [14, 15, 16, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 155, 156, 171, 177], "v5": [17, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 156, 160, 169], "vairodp": 156, "val": 175, "valentin": 156, "valid": [2, 4, 5, 7, 10, 13, 14, 158, 163, 173, 174, 178], "valid_act": 173, "valid_next_act": 173, "vallei": [133, 134], "valu": [2, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 20, 127, 129, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 150, 151, 152, 153, 154, 155, 156, 158, 160, 163, 165, 166, 169, 173, 174, 175, 177, 178], "value_funct": 160, "value_grid": 174, "value_pr": 178, "valueerror": [7, 8, 11, 12, 13, 17], "vampir": 148, "var": 19, "vari": [132, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 177], "variabl": [2, 5, 7, 11, 13, 14, 15, 17, 136, 137, 139, 146, 147, 148, 155, 156, 158, 165, 166, 174, 177], "varianc": [14, 18, 19, 20, 173, 178], "variant": [128, 165], "variat": 136, "varieti": [9, 148], "variou": [5, 141, 148, 155, 177], "ve": [155, 156, 159, 163], "vec_env": [9, 159], "vecenvwrapp": 155, "vector": [2, 4, 7, 9, 11, 12, 16, 17, 18, 19, 127, 129, 142, 143, 145, 148, 155, 156, 158, 159, 161, 170, 176, 177], "vector_a2c": 178, "vector_entry_point": [4, 132, 156], "vector_env": 14, "vector_kwarg": 4, "vector_list_info": 155, "vectoractionwrapp": [14, 156], "vectorenv": [4, 5, 14, 155, 156], "vectorenvcr": 4, "vectorenvwrapp": 156, "vectoris": [5, 148], "vectorization_mod": [4, 9, 10, 11, 12, 14, 132, 156], "vectorizemod": 4, "vectorizetransformact": [14, 20], "vectorizetransformobserv": [14, 20], "vectorizetransformreward": [14, 20], "vectorizor": [4, 132], "vectorlistinfo": [14, 155, 156], "vectorobservationwrapp": [14, 156], "vectorrewardwrapp": [14, 156], "vectorwrapp": [14, 156], "vehicl": 148, "veloc": [2, 8, 13, 127, 129, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 158, 159], "velocity_penalti": 142, "veri": [6, 129, 144, 155, 156, 158, 159, 162, 163, 165, 178], "verifi": [9, 159, 160, 163], "vermouth1992": [155, 156], "versa": [13, 17, 18, 160], "version": [1, 2, 4, 5, 14, 16, 17, 18, 19, 148, 155, 156, 159, 160, 163, 165, 166, 167, 169, 173, 174, 175, 177, 178], "vertic": [127, 139, 141, 142, 143, 147, 159, 165], "vf_next_stat": 166, "vf_target": 166, "via": [5, 9, 14, 15, 17, 126, 130, 136, 148, 149, 158, 165, 177], "viabl": 174, "vicbentu": 156, "vice": [13, 17, 18, 160], "vicent": 156, "video": [1, 17, 20, 127, 155, 156, 158, 159, 161, 163, 169, 171, 175], "video0": 169, "video_fold": [9, 17, 161], "video_length": [9, 17], "video_path": 161, "videorecord": [17, 155, 156], "view": [2, 156, 159, 169], "view_init": 174, "viewer": [10, 11, 12, 156], "viewport": 129, "viewport_h": 129, "viewport_w": 129, "virgilt": 155, "viridi": 174, "viscou": 146, "visibl": 165, "visit": [128, 175], "visual": [148, 158, 159, 160, 161, 163, 169], "visual_env": 160, "visual_opt": [136, 156], "visualis": 2, "vizdoom": 148, "vmoen": [155, 156], "voidflight": 156, "vol": [131, 154], "volleybal": 148, "volunt": 156, "vscode": [156, 171], "vwxyzjn": 155, "vx": [14, 17, 129], "vy": 129, "w": [9, 137, 140, 141, 178], "w_": [137, 138, 139, 140, 141, 144, 145, 146, 147], "wa": [2, 4, 6, 9, 10, 14, 17, 18, 19, 132, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 155, 156, 159, 160, 163, 166, 167, 177, 178], "wai": [2, 13, 15, 17, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 155, 156, 158, 163, 166, 167, 174, 175, 178], "wait": [9, 10, 11, 155, 166], "wait_on_play": 9, "wake": 129, "walk": [136, 140, 147, 149, 153, 156, 159, 165, 169], "walker": [126, 145, 147, 155], "walker2d": [136, 156], "walker2d_v5": 147, "wall": [133, 134, 154, 159, 161, 173], "wandb": 161, "want": [1, 2, 4, 6, 11, 15, 17, 137, 140, 141, 155, 156, 158, 159, 160, 161, 165, 167, 169, 174, 175, 178], "ward": 177, "warehous": 148, "warn": [6, 9, 10, 11, 17, 144, 155, 156], "wasn": 17, "wast": 173, "watch": [1, 161, 163, 171], "water": 148, "wawrzy\u0144ski": 138, "we": [1, 2, 3, 4, 5, 7, 9, 13, 18, 148, 155, 156, 157, 158, 159, 160, 161, 162, 163, 165, 166, 167, 169, 173, 174, 177, 178], "web": 148, "websit": [21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 136, 155, 156], "weigh": 137, "weight": [137, 138, 139, 140, 141, 144, 145, 146, 147, 148, 155, 161, 166, 167, 177], "well": [2, 5, 14, 131, 148, 155, 159, 163, 165, 175, 178], "were": [126, 131, 136, 154, 155, 156, 160, 163, 165, 169, 178], "weren": 160, "west": [154, 173], "what": [2, 5, 6, 148, 151, 152, 156, 159, 161, 162], "wheel": [126, 128, 155], "when": [2, 4, 5, 8, 9, 10, 11, 12, 13, 14, 17, 18, 20, 128, 129, 137, 139, 140, 141, 142, 143, 144, 147, 151, 152, 153, 154, 155, 156, 158, 159, 160, 163, 165, 166, 167, 169, 173, 175, 177, 178], "whenev": [17, 129, 165], "where": [1, 4, 6, 7, 8, 9, 14, 17, 128, 129, 131, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 150, 151, 152, 153, 154, 155, 156, 157, 158, 159, 160, 161, 162, 163, 165, 166, 167, 169, 173, 174, 175, 177, 178], "wherea": 175, "whether": [2, 3, 4, 5, 7, 9, 15, 17, 129, 137, 138, 139, 140, 141, 146, 147, 148, 150, 158, 159, 163, 165, 166, 174, 177], "which": [1, 2, 4, 5, 8, 9, 10, 14, 17, 18, 127, 128, 129, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 150, 151, 152, 153, 154, 155, 156, 158, 159, 160, 162, 165, 166, 167, 169, 171, 173, 175, 177, 178], "while": [4, 8, 9, 11, 14, 17, 18, 19, 129, 131, 132, 135, 137, 140, 141, 146, 150, 151, 152, 155, 158, 159, 160, 161, 163, 165, 166, 173, 174, 175, 177, 178], "white": 155, "who": 156, "whole": [4, 155, 156, 169], "whose": [137, 150], "why": [129, 163], "wide": [148, 158], "width": [136, 156, 165], "wikipedia": 175, "wildli": 163, "willdudlei": 156, "william": [133, 134, 177], "win": [150, 163, 174], "win_rat": 163, "wind": [129, 155, 156], "wind_pow": [129, 155, 178], "window": [2, 9, 128, 136, 155, 156, 158, 160, 161, 163, 165], "window_s": 165, "wing": 148, "wire": 148, "wireless": 148, "wise": 177, "wish": [9, 155, 156], "within": [2, 5, 7, 9, 13, 14, 16, 17, 18, 20, 129, 130, 143, 155, 156, 158, 159], "without": [14, 15, 17, 19, 140, 148, 150, 153, 155, 156, 158, 159, 163, 165, 169, 173, 174], "won": [2, 163, 174], "word": [144, 177], "work": [5, 9, 128, 129, 131, 138, 139, 142, 143, 148, 155, 156, 158, 159, 160, 163], "worker": 11, "workflow": 156, "workshop": 148, "world": [129, 148, 151, 152, 153, 154, 156, 173, 175], "worldbodi": [137, 140, 141], "worri": 165, "wors": [155, 163], "would": [6, 8, 16, 18, 19, 137, 138, 139, 140, 146, 147, 155, 156, 157, 165, 167, 169, 178], "wouldn": 156, "wrap": [2, 4, 9, 11, 12, 14, 15, 16, 17, 18, 19, 20, 148, 158, 159, 165, 167, 177, 178], "wrapped_env": [14, 15, 16, 17, 18, 158, 159, 165, 167, 177], "wrapped_env_ob": 16, "wrapped_obs0": 18, "wrapped_obs1": 18, "wrappedenvacttyp": 156, "wrappedenvobstyp": 156, "wrapper": [2, 4, 6, 7, 9, 10, 13, 137, 138, 139, 140, 141, 143, 146, 147, 148, 153, 154, 155, 156, 158, 161, 163, 168, 170, 174, 177, 178], "wrapper_spec": 15, "wrapperacttyp": [15, 16], "wrapperobstyp": [15, 18], "wrapperspec": [4, 15], "wrist": 144, "write": [5, 11, 13, 156, 159, 165, 169], "write_to_shared_memori": [5, 13], "written": [9, 156, 162], "wrong": [155, 156, 158, 159, 160, 163], "www": [128, 150, 151, 152, 153, 155], "x": [2, 5, 8, 14, 129, 132, 133, 134, 135, 137, 138, 139, 140, 141, 142, 144, 145, 146, 147, 148, 151, 152, 156, 159, 161, 165, 175, 177, 178], "x_": [137, 138, 139, 140, 142, 146, 147], "x_init": 133, "x_posit": [14, 137, 138, 139, 140, 141, 146, 147], "x_veloc": 14, "xlabel": [161, 173], "xml": [137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 155, 156, 169], "xml_file": [136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 156, 169], "xp": 14, "xpo": [137, 140, 144, 145], "xtick": 174, "xticklabel": 175, "xuanhien070594": 156, "xuehaipan": [155, 156], "xx": 175, "xy": 142, "y": [2, 129, 135, 137, 138, 139, 140, 141, 142, 144, 145, 146, 154, 159, 175, 177], "y_": 142, "y_coordin": 142, "y_init": 133, "y_posit": [137, 138, 139, 140, 141, 146, 147], "yaniv": 156, "year": [133, 134, 155, 156], "yellow": 154, "yet": [148, 156], "yield": 13, "ylabel": [161, 173, 175], "you": [1, 2, 5, 6, 7, 8, 9, 11, 14, 15, 16, 17, 18, 19, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 127, 128, 137, 140, 141, 148, 155, 156, 157, 158, 160, 161, 163, 165, 166, 167, 169, 171, 173, 175, 178], "youjiacheng": 155, "youni": [155, 156], "younik": [155, 156], "your": [1, 2, 5, 9, 11, 14, 15, 16, 17, 18, 128, 137, 140, 141, 148, 155, 156, 157, 162, 167, 168, 170, 174, 178], "your_env": 9, "yourself": [11, 128, 159, 165, 174], "ytick": 174, "yticklabel": 175, "z": [137, 138, 139, 140, 141, 142, 144, 145, 147], "z_": 141, "z_distance_from_origin": [139, 141, 147], "zaxi": 174, "zemann": [174, 178], "zenodo": 156, "zero": [7, 13, 18, 135, 137, 139, 140, 141, 147, 156, 163, 165, 166, 173, 174, 175, 177, 178], "zero_grad": [177, 178], "zhiqingxiao": 155, "zip": [170, 173], "zlig": 155, "zoom": 9, "zuoxingdong": 155, "zzyunzhi": 155, "\u03b1": 173, "\u03b3": 173, "\u03b5": 173}, "titles": ["404 - Page Not Found", "Gymnasium-docs", "Env", "Functional Env", "Make and register", "Spaces", "Composite Spaces", "Fundamental Spaces", "Spaces Utils", "Utility functions", "Vectorize", "AsyncVectorEnv", "SyncVectorEnv", "Utility functions", "Wrappers", "Wrappers", "Action Wrappers", "Misc Wrappers", "Observation Wrappers", "Reward Wrappers", "List of Wrappers", "Atari", "Adventure", "Air Raid", "Alien", "Amidar", "Assault", "Asterix", "Asteroids", "Atlantis", "Atlantis2", "Backgammon", "Bank Heist", "Basic Math", "Battle Zone", "Beam Rider", "Berzerk", "Blackjack", "Bowling", "Boxing", "Breakout", "Carnival", "Casino", "Centipede", "Chopper Command", "Crazy Climber", "Crossbow", "Darkchambers", "Defender", "Demon Attack", "Donkey Kong", "Double Dunk", "Earthworld", "Elevator Action", "Enduro", "Entombed", "Et", "Fishing Derby", "Flag Capture", "Freeway", "Frogger", "Frostbite", "Galaxian", "Gopher", "Gravitar", "Hangman", "Haunted House", "Hero", "Human Cannonball", "Ice Hockey", "Jamesbond", "Journey Escape", "Kaboom", "Kangaroo", "Keystone Kapers", "King Kong", "Klax", "Koolaid", "Krull", "Kung Fu Master", "Laser Gates", "Lost Luggage", "Mario Bros", "Miniature Golf", "Montezuma Revenge", "Mr Do", "Ms Pacman", "Name This Game", "Othello", "Pacman", "Phoenix", "Pitfall", "Pitfall2", "Pong", "Pooyan", "Private Eye", "Qbert", "Riverraid", "Road Runner", "Robotank", "Seaquest", "Sir Lancelot", "Skiing", "Solaris", "Space Invaders", "Space War", "Star Gunner", "Superman", "Surround", "Tennis", "Tetris", "Tic Tac Toe 3D", "Time Pilot", "Trondead", "Turmoil", "Tutankham", "Up N Down", "Venture", "Video Checkers", "Video Chess", "Video Cube", "Video Pinball", "Wizard Of Wor", "Word Zapper", "Yars Revenge", "Zaxxon", "Box2D", "Bipedal Walker", "Car Racing", "Lunar Lander", "Classic Control", "Acrobot", "Cart Pole", "Mountain Car", "Mountain Car Continuous", "Pendulum", "MuJoCo", "Ant", "Half Cheetah", "Hopper", "Humanoid", "Humanoid Standup", "Inverted Double Pendulum", "Inverted Pendulum", "Pusher", "Reacher", "Swimmer", "Walker2D", "External Environments", "Toy Text", "Blackjack", "Cliff Walking", "Cliff Walking Slippery", "Frozen Lake", "Taxi", "Gym Release Notes", "Gymnasium Release Notes", "<no title>", "Basic Usage", "Create a Custom Environment", "Gym Migration Guide", "Recording Agents", "Speeding Up Training", "Training an Agent", "Gymnasium Basics", "Make your own custom environment", "Handling Time Limits", "Implementing Custom Wrappers", "Gymnasium Basics", "Load custom quadruped robot environments", "Tutorials", "Third-Party Tutorials", "Training Agents", "Action Masking in the Taxi Environment", "Solving Blackjack with Tabular Q-Learning", "Solving Frozenlake with Tabular Q-Learning", "Training Agents", "Training using REINFORCE for Mujoco", "Speeding up A2C Training with Vector Envs"], "titleterms": {"0": [155, 156, 160, 169], "0a1": 156, "0a2": 156, "1": [155, 156, 160, 169], "11": 175, "12": 155, "19": 155, "2": [155, 156, 160, 169], "20": 155, "21": [155, 160], "22": 155, "23": 155, "24": 155, "25": 155, "26": [155, 156, 160], "27": 156, "28": 156, "29": 156, "3": [155, 156, 160, 169], "3d": 111, "4": [155, 160, 169, 175], "404": 0, "5": [155, 160], "6": 155, "7": [155, 175], "9": [155, 175], "Not": 0, "Of": 122, "The": [0, 160, 163, 175], "__init__": 159, "a2c": 178, "about": [159, 163, 171], "acrobot": 131, "across": 136, "action": [14, 16, 53, 127, 128, 129, 131, 132, 133, 134, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 150, 151, 152, 153, 154, 158, 159, 163, 173, 174], "actionwrapp": 167, "actor": 178, "ad": [1, 159], "add": 159, "addit": [4, 10, 11, 12], "advanc": 159, "advantag": 178, "adventur": 22, "agent": [158, 161, 163, 169, 170, 172, 174, 176, 177, 178], "agilerl": 171, "air": 23, "algorithm": 162, "alien": 24, "alpha": 156, "alpha1": 156, "altern": 165, "amidar": 25, "an": [1, 163, 174, 177], "analysi": [173, 178], "analyz": 163, "ant": 137, "api": [9, 160], "argument": [127, 128, 129, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 150, 151, 152, 153, 154], "assault": 26, "asterix": 27, "asteroid": 28, "asynchron": 178, "asyncvectorenv": 11, "atari": 21, "atlanti": 29, "atlantis2": 30, "attack": 49, "attribut": [2, 5, 10, 15], "autonom": 148, "avail": 16, "backend": 136, "backgammon": 31, "bank": 32, "base": [3, 16], "basic": [33, 158, 164, 168, 170], "battl": 34, "beam": 35, "befor": 159, "beginn": 158, "benchmark": 9, "benefit": 161, "berzerk": 36, "best": 161, "better": 174, "biolog": 148, "biped": 127, "blackjack": [37, 150, 163, 174], "boundari": 159, "bowl": 38, "box": 39, "box2d": 126, "breakdown": 160, "breakout": 40, "bro": 82, "build": [1, 163, 174, 177], "can": 174, "cannonbal": 68, "captur": 58, "car": [128, 133, 134], "carniv": 41, "cart": 132, "casino": 42, "centiped": 43, "chang": 160, "check": [9, 159], "checker": 118, "cheetah": 138, "chess": 119, "chopper": 44, "class": 16, "classic": 130, "cliff": [151, 152], "climber": 45, "close": 165, "code": [158, 159, 160, 166, 171], "command": 44, "common": [14, 17, 158, 159, 163], "compar": 136, "comparison": 160, "compat": [9, 160], "complet": 160, "complex": 159, "composit": [5, 6], "comput": 148, "construct": [159, 165], "continu": 134, "control": 130, "convers": [14, 17], "convert": 3, "core": 4, "could": 0, "crazi": 45, "creat": [2, 159, 165, 175], "credit": [127, 128, 129], "critic": 178, "crossbow": 46, "cube": 120, "curv": 177, "custom": [159, 165, 167, 169], "darkchamb": 47, "data": [14, 17], "debug": 159, "declar": 165, "defend": 48, "demon": 49, "derbi": 57, "descript": [127, 128, 129, 131, 132, 133, 134, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 150, 151, 152, 153, 154], "design": 159, "did": 160, "do": [85, 174], "doc": 1, "document": 1, "domain": 178, "done": 160, "donkei": 50, "doubl": [51, 142], "down": 116, "download": 169, "drive": 148, "dunk": 51, "dure": [161, 163], "dynam": [133, 134], "earthworld": 52, "econom": 148, "edit": 1, "electr": 148, "elev": 53, "end": [131, 132, 133, 134, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 150, 151, 152, 153, 154], "enduro": 54, "energi": 148, "entomb": 55, "env": [2, 3, 165, 178], "environ": [1, 2, 3, 9, 10, 132, 148, 158, 159, 160, 162, 163, 165, 169, 173, 174, 175, 178], "epilogu": 169, "episod": [127, 128, 129, 131, 132, 133, 134, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 150, 151, 152, 153, 154, 161], "error": 159, "escap": 71, "et": 56, "evalu": 161, "everi": 161, "exact": 136, "exampl": 159, "execut": [163, 174], "expect": 163, "experi": [161, 173], "explain": 158, "exploit": 163, "explor": 163, "extern": 148, "ey": 95, "featur": 159, "financi": 148, "first": [148, 158], "fish": 57, "flag": 58, "found": 0, "freecodecamp": 171, "freewai": 59, "frogger": 60, "from": [165, 167, 171], "frostbit": 61, "frozen": 153, "frozenlak": 175, "fu": 79, "function": [3, 4, 5, 9, 13, 159, 160], "fundament": [5, 7], "galaxian": 62, "game": [87, 148], "gate": 80, "gener": [160, 165], "get": [160, 163], "golf": 83, "gopher": 63, "gradual": 159, "gravitar": 64, "gridworld": 159, "guid": 160, "gunner": 106, "gym": [148, 155, 160], "gymnasium": [1, 10, 148, 156, 158, 164, 165, 167, 168, 170, 171], "half": 138, "handl": [159, 166], "hangman": 65, "haunt": 66, "heist": 32, "help": 160, "helper": 160, "hero": 67, "heurist": 162, "histori": [127, 128, 129, 131, 132, 133, 134, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 150, 151, 152, 153, 154], "hockei": 69, "hopper": 139, "hous": 66, "how": 173, "human": 68, "humanoid": [140, 141], "i": 158, "ic": 69, "implement": [2, 14, 18, 19, 167], "import": [166, 174], "improv": 163, "includ": 160, "inform": [150, 151, 152, 153, 154, 161], "inherit": 167, "initi": [156, 158, 165], "instanc": 165, "instruct": 1, "integr": 161, "interpret": 163, "introduct": 178, "intuit": 163, "invad": 104, "invert": [142, 143], "issu": [158, 159, 163], "jamesbond": 70, "jax": 3, "johnni": 171, "journei": 71, "kaboom": 72, "kangaroo": 73, "kaper": 74, "kei": [159, 160], "keyston": 74, "king": 75, "klax": 76, "known": 159, "kong": [50, 75], "koolaid": 77, "krull": 78, "kung": 79, "lake": 153, "lancelot": 101, "lander": 129, "laser": 80, "learn": [158, 159, 163, 166, 174, 175, 177], "librari": 171, "limit": 166, "list": 20, "ll": 175, "load": [160, 169, 178], "loop": [158, 163], "lost": 81, "luggag": 81, "lunar": 129, "m": 86, "make": [4, 10, 159, 165], "manual": 159, "map": 175, "mario": 82, "mask": 173, "master": 79, "math": 33, "mathemat": 148, "medic": 148, "memori": 13, "method": [2, 5, 10, 11, 12, 15], "migrat": 160, "miniatur": 83, "misc": 17, "miscellan": 13, "mode": 160, "model": 169, "modifi": [1, 158], "montezuma": 84, "more": 161, "mountain": [133, 134], "mr": 85, "mujoco": [136, 177], "n": 116, "name": [87, 160], "network": 177, "never": 163, "new": [1, 9, 160], "next": [158, 159, 163], "note": [129, 146, 155, 156], "notic": 178, "number": 160, "observ": [14, 18, 127, 128, 129, 131, 132, 133, 134, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 150, 151, 152, 153, 154, 158, 159, 165, 169, 174], "observationwrapp": 167, "old": [9, 160], "onli": [14, 20], "openai": 160, "optim": 162, "othello": 88, "other": [1, 148], "output": 161, "own": 165, "packag": [160, 165], "pacman": [86, 89], "page": [0, 1], "paramet": [169, 175], "parameter": 159, "parti": [148, 171], "pendulum": [135, 142, 143], "perform": [9, 136, 178], "period": 161, "phoenix": 90, "pickl": 9, "pilot": 112, "pinbal": 121, "pitfal": [91, 159], "pitfall2": 92, "plai": 178, "plot": [177, 178], "pole": 132, "polici": [174, 177], "pong": 93, "poor": 163, "pooyan": 94, "practic": 161, "privat": 95, "problem": 159, "process": 163, "program": 158, "pusher": 144, "q": [163, 174, 175], "qbert": 96, "quadrup": 169, "question": 159, "quick": 160, "race": 128, "raid": 23, "random": [160, 178], "reacher": 145, "read": 160, "real": 159, "recommend": 165, "record": 161, "refer": [128, 131, 150, 151, 152, 154, 160, 175, 177, 178], "regist": [4, 159, 165], "reinforc": [158, 177], "releas": [155, 156], "remov": 160, "render": [9, 136, 159, 160, 165], "represent": 159, "reproduc": 136, "request": 0, "research": 159, "reset": [128, 159, 160, 165], "result": [163, 173], "reveng": [84, 124], "reward": [14, 19, 127, 128, 129, 131, 132, 133, 134, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 150, 151, 152, 153, 154, 159, 169], "rewardwrapp": 167, "rider": 35, "riverraid": 97, "rl": 158, "road": 98, "robot": [148, 169], "robotank": 99, "run": [173, 175], "runner": 98, "runtim": 9, "save": [9, 178], "seaquest": 100, "seed": [9, 160], "setup": [165, 169, 174, 178], "share": 13, "should": 160, "showcas": 178, "side": 160, "simpl": 159, "simul": 169, "sir": 101, "size": 175, "ski": 102, "slipperi": 152, "slow": 163, "solari": 103, "solut": [163, 165, 166], "solv": [174, 175], "space": [5, 6, 7, 8, 13, 104, 105, 127, 128, 129, 131, 132, 133, 134, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 150, 151, 152, 153, 154, 158, 159], "specif": 160, "speed": [162, 178], "split": 160, "standard": 3, "standup": 141, "star": 106, "start": [127, 128, 129, 131, 132, 133, 134, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 150, 151, 152, 153, 154, 159], "state": [127, 128, 129, 131, 132, 133, 134, 135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 150, 151, 152, 153, 154, 159, 165], "step": [1, 9, 158, 159, 160, 163, 165, 169], "strategi": 163, "stuck": 163, "subclass": 165, "summari": 161, "superman": 107, "surround": 108, "swimmer": 146, "synchron": 178, "syncvectorenv": 12, "system": 148, "tabl": [160, 175], "tabular": [174, 175], "tac": 111, "taxi": [154, 173], "telecommun": 148, "tenni": 109, "termin": [127, 128, 129, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 160, 166, 169], "test": [159, 160, 163], "tetri": 110, "text": 149, "thi": [87, 160], "think": [159, 174], "third": [148, 171], "tic": 111, "time": [112, 166, 175], "timelimit": 160, "tip": 159, "toe": 111, "toi": 149, "too": 163, "track": 161, "train": [136, 161, 162, 163, 169, 170, 172, 174, 176, 177, 178], "transit": [133, 134], "trondead": 113, "truncat": [135, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 160, 166], "try": 178, "turmoil": 114, "tutankham": 115, "tutori": [1, 170, 171], "tweak": 169, "uncommon": 17, "understand": [158, 161, 163, 173], "unstabl": 163, "up": [116, 162, 178], "updat": 163, "us": [148, 159, 165, 171, 175, 177, 178], "usag": 158, "util": [5, 8, 9, 13], "v": 163, "v0": [155, 156, 160], "v1": [156, 160], "valid": 159, "variabl": 4, "vector": [5, 10, 13, 14, 20, 132, 162, 178], "vectorenv": 10, "ventur": 117, "version": [127, 128, 129, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 150, 151, 152, 153, 154], "video": [9, 118, 119, 120, 121, 148], "visual": [9, 173, 174, 175], "visualis": 174, "walk": [151, 152], "walker": 127, "walker2d": 147, "war": 105, "we": 175, "weight": 178, "what": [158, 163], "when": 161, "who": 160, "why": [158, 160, 161], "wizard": 122, "wor": 122, "word": 123, "work": 173, "world": 159, "wrapper": [14, 15, 16, 17, 18, 19, 20, 159, 160, 165, 167], "write": 1, "yar": 124, "you": [159, 174], "your": [158, 159, 160, 161, 163, 165, 169], "yourself": 178, "youtub": 171, "zapper": 123, "zaxxon": 125, "zone": 34}})