2016-04-27 08:00:58 -07:00
import re
2019-03-08 14:50:32 -08:00
import importlib
2019-03-24 06:27:58 +09:00
import warnings
Cleanup, removal of unmaintained code (#836)
* add dtype to Box
* remove board_game, debugging, safety, parameter_tuning environments
* massive set of breaking changes
- remove python logging module
- _step, _reset, _seed, _close => non underscored method
- remove benchmark and scoring folder
* Improve render("human"), now resizable, closable window.
* get rid of default step and reset in wrappers, so it doesn’t silently fail for people with underscore methods
* CubeCrash unit test environment
* followup fixes
* MemorizeDigits unit test envrionment
* refactored spaces a bit
fixed indentation
disabled test_env_semantics
* fix unit tests
* fixes
* CubeCrash, MemorizeDigits tested
* gym backwards compatibility patch
* gym backwards compatibility, followup fixes
* changelist, add spaces to main namespaces
* undo_logger_setup for backwards compat
* remove configuration.py
2018-01-25 18:20:14 -08:00
from gym import error , logger
2016-04-27 08:00:58 -07:00
# This format is true today, but it's *not* an official spec.
# [username/](env-name)-v(version)    env-name is group 1, version is group 2
#
# 2016-10-31: We're experimentally expanding the environment ID format
# to include an optional username.
#
# The optional "username/" prefix is a non-capturing group, so the group
# numbering above is the same whether or not a username is present.
env_id_re = re.compile(r'^(?:[\w:-]+\/)?([\w:.-]+)-v(\d+)$')
2016-04-27 08:00:58 -07:00
2019-03-08 14:50:32 -08:00
2016-04-27 08:00:58 -07:00
def load(name):
    """Import and return the object named by an entry-point string.

    Args:
        name (str): Entry point of the form ``"module.path:attribute"``.

    Returns:
        The attribute ``attribute`` looked up on the imported module.

    Raises:
        ValueError: If ``name`` does not contain exactly one ``:``.
        ImportError: If the module part cannot be imported.
        AttributeError: If the module has no such attribute.
    """
    parts = name.split(":")
    if len(parts) != 2:
        # Same exception type the bare tuple-unpacking would raise, but with
        # a message that tells the caller what was expected.
        raise ValueError(
            "Entry point must be of the form 'module:attribute', got {!r}".format(name)
        )
    mod_name, attr_name = parts
    mod = importlib.import_module(mod_name)
    return getattr(mod, attr_name)
2016-04-27 08:00:58 -07:00
class EnvSpec(object):
    """A specification for a particular instance of the environment. Used
    to register the parameters for official evaluations.

    Args:
        id (str): The official environment ID
        entry_point (Optional[str or callable]): The Python entrypoint of the environment class (e.g. module.name:Class), or a callable that builds the environment
        reward_threshold (Optional[int]): The reward threshold before the task is considered solved
        kwargs (dict): The kwargs to pass to the environment class
        nondeterministic (bool): Whether this environment is non-deterministic even after seeding
        tags (dict[str:any]): A set of arbitrary key-value tags on this environment, including simple property=True tags
        max_episode_steps (Optional[int]): The maximum number of steps that an episode can consist of

    Attributes:
        id (str): The official environment ID

    Raises:
        error.Error: If ``id`` does not match ``env_id_re``.
    """

    def __init__(self, id, entry_point=None, reward_threshold=None, kwargs=None, nondeterministic=False, tags=None, max_episode_steps=None):
        self.id = id
        # Evaluation parameters
        self.reward_threshold = reward_threshold
        # Environment properties
        self.nondeterministic = nondeterministic
        self.entry_point = entry_point

        # Work on a copy: the step limit is recorded as a tag below, and that
        # write must not leak into a dict the caller may reuse for other specs.
        tags = {} if tags is None else dict(tags)
        tags['wrapper_config.TimeLimit.max_episode_steps'] = max_episode_steps
        self.tags = tags

        self.max_episode_steps = max_episode_steps

        # We may make some of these other parameters public if they're
        # useful.
        match = env_id_re.search(id)
        if not match:
            raise error.Error('Attempted to register malformed environment ID: {}. (Currently all IDs must be of the form {}.)'.format(id, env_id_re.pattern))
        # Name without the "-v<N>" suffix (group 1 of env_id_re).
        self._env_name = match.group(1)
        self._kwargs = {} if kwargs is None else kwargs

    def make(self, **kwargs):
        """Instantiates an instance of the environment with appropriate kwargs.

        Keyword arguments given here override the ones stored at
        registration time; the stored dict itself is not modified.

        Raises:
            error.Error: If this spec has no entry point.
        """
        if self.entry_point is None:
            raise error.Error('Attempting to make deprecated env {}. (HINT: is there a newer registered version of this env?)'.format(self.id))
        _kwargs = self._kwargs.copy()
        _kwargs.update(kwargs)
        if callable(self.entry_point):
            env = self.entry_point(**_kwargs)
        else:
            # String entry points are resolved to a class/factory first.
            cls = load(self.entry_point)
            env = cls(**_kwargs)

        # Make the environment aware of which spec it came from.
        env.unwrapped.spec = self

        return env

    def __repr__(self):
        return "EnvSpec({})".format(self.id)
class EnvRegistry(object):
    """Register an env by ID. IDs remain stable over time and are
    guaranteed to resolve to the same environment dynamics (or be
    desupported). The goal is that results on a particular environment
    should always be comparable, and not depend on the version of the
    code that was running.
    """

    def __init__(self):
        # Maps environment ID -> EnvSpec.
        self.env_specs = {}

    def make(self, path, **kwargs):
        """Look up the spec for ``path`` and build an environment from it.

        Args:
            path (str): An environment ID, optionally prefixed with
                ``"module:"`` (see ``spec``).
            **kwargs: Forwarded to the spec's ``make``.

        Returns:
            The environment, wrapped in ``TimeLimit`` when its spec defines
            ``max_episode_steps`` and the spec has no truthy ``'vnc'`` tag.
        """
        if kwargs:
            logger.info('Making new env: %s (%s)', path, kwargs)
        else:
            logger.info('Making new env: %s', path)
        spec = self.spec(path)
        env = spec.make(**kwargs)
        # We used to have people override _reset/_step rather than
        # reset/step. Set _gym_disable_underscore_compat = True on
        # your environment if you use these methods and don't want
        # compatibility code to be invoked.
        if hasattr(env, "_reset") and hasattr(env, "_step") and not getattr(env, "_gym_disable_underscore_compat", False):
            patch_deprecated_methods(env)
        if (env.spec.max_episode_steps is not None) and not spec.tags.get('vnc'):
            # Imported here rather than at module level, as in the original
            # (presumably to avoid an import cycle -- TODO confirm).
            from gym.wrappers.time_limit import TimeLimit
            env = TimeLimit(env, max_episode_steps=env.spec.max_episode_steps)
        return env

    def all(self):
        """Return all registered specs (the values of ``env_specs``)."""
        return self.env_specs.values()

    def spec(self, path):
        """Return the registered spec for ``path``.

        Args:
            path (str): Either ``"<env-id>"`` or ``"<module>:<env-id>"``. In
                the second form the module is imported before the lookup
                (presumably so that it can register its environments as an
                import side effect -- verify against the module in question).

        Raises:
            error.Error: If the module cannot be imported or the ID is
                malformed.
            error.DeprecatedEnv: If the ID is unknown but other versions of
                the same environment name are registered.
            error.UnregisteredEnv: If nothing with that name is registered.
        """
        if ':' in path:
            mod_name, _sep, id = path.partition(':')
            try:
                importlib.import_module(mod_name)
            # catch ImportError for python2.7 compatibility
            except ImportError:
                raise error.Error('A module ({}) was specified for the environment but was not found, make sure the package is installed with `pip install` before calling `gym.make()`'.format(mod_name))
        else:
            id = path

        match = env_id_re.search(id)
        if not match:
            raise error.Error('Attempted to look up malformed environment ID: {}. (Currently all IDs must be of the form {}.)'.format(id.encode('utf-8'), env_id_re.pattern))

        try:
            return self.env_specs[id]
        except KeyError:
            # Parse the env name and check to see if it matches the non-version
            # part of a valid env (could also check the exact number here)
            env_name = match.group(1)
            matching_envs = [valid_env_name for valid_env_name, valid_env_spec in self.env_specs.items()
                             if env_name == valid_env_spec._env_name]
            if matching_envs:
                raise error.DeprecatedEnv('Env {} not found (valid versions include {})'.format(id, matching_envs))
            else:
                raise error.UnregisteredEnv('No registered env with id: {}'.format(id))

    def register(self, id, **kwargs):
        """Create an ``EnvSpec`` from the arguments and store it under ``id``.

        Raises:
            error.Error: If ``id`` is already registered.
        """
        if id in self.env_specs:
            raise error.Error('Cannot re-register id: {}'.format(id))
        self.env_specs[id] = EnvSpec(id, **kwargs)
2016-04-27 08:00:58 -07:00
# Module-wide registry instance; the module-level register(), make() and
# spec() functions all delegate to it.
registry = EnvRegistry()
2016-08-20 16:05:50 -07:00
def register(id, **kwargs):
    """Register an environment under ``id`` in the global ``registry``.

    ``id`` and every keyword argument are forwarded unchanged to
    ``registry.register``; its return value is passed back to the caller.
    """
    outcome = registry.register(id, **kwargs)
    return outcome
2019-01-29 13:37:43 -08:00
def make(id, **kwargs):
    """Build the environment identified by ``id`` via the global ``registry``.

    ``id`` and every keyword argument are forwarded unchanged to
    ``registry.make``; the environment it returns is passed back.
    """
    environment = registry.make(id, **kwargs)
    return environment
2016-08-20 16:05:50 -07:00
def spec(id):
    """Return whatever the global ``registry`` has on record for ``id``.

    Thin wrapper around ``registry.spec``.
    """
    found = registry.spec(id)
    return found
Cleanup, removal of unmaintained code (#836)
* add dtype to Box
* remove board_game, debugging, safety, parameter_tuning environments
* massive set of breaking changes
- remove python logging module
- _step, _reset, _seed, _close => non underscored method
- remove benchmark and scoring folder
* Improve render("human"), now resizable, closable window.
* get rid of default step and reset in wrappers, so it doesn’t silently fail for people with underscore methods
* CubeCrash unit test environment
* followup fixes
* MemorizeDigits unit test envrionment
* refactored spaces a bit
fixed indentation
disabled test_env_semantics
* fix unit tests
* fixes
* CubeCrash, MemorizeDigits tested
* gym backwards compatibility patch
* gym backwards compatibility, followup fixes
* changelist, add spaces to main namespaces
* undo_logger_setup for backwards compat
* remove configuration.py
2018-01-25 18:20:14 -08:00
# Module-level flag: the deprecation warning below is emitted at most once
# per process, for the first environment that gets patched.
warn_once = True


def patch_deprecated_methods(env):
    """
    Methods renamed from '_method' to 'method', render() no longer has 'close' parameter, close is a separate method.
    For backward compatibility, this makes it possible to work with unmodified environments.

    The public names are set as attributes on the ``env`` instance itself.
    ``env`` must provide ``_reset`` and ``_step``. ``_seed`` and ``_render``
    are optional: when one is missing, the matching public attribute(s) are
    left untouched instead of failing or installing a shim that could
    never work.

    Args:
        env: Environment instance implementing the underscore-prefixed API.
    """
    global warn_once
    if warn_once:
        logger.warn("Environment '%s' has deprecated methods '_step' and '_reset' rather than 'step' and 'reset'. Compatibility code invoked. Set _gym_disable_underscore_compat = True to disable this behavior." % str(type(env)))
        warn_once = False
    env.reset = env._reset
    env.step = env._step
    # Callers may only have verified _reset/_step, so the remaining legacy
    # hooks cannot be assumed to exist.
    if hasattr(env, "_seed"):
        env.seed = env._seed
    if hasattr(env, "_render"):
        # The old _render(mode, close) doubled as the close hook; split it
        # into the two separate public methods.
        def render(mode="human"):
            return env._render(mode, close=False)

        def close():
            env._render("human", close=True)

        env.render = render
        env.close = close