diff --git a/baselines/gail/behavior_clone.py b/baselines/gail/behavior_clone.py index 82f65ec..aab1bc6 100644 --- a/baselines/gail/behavior_clone.py +++ b/baselines/gail/behavior_clone.py @@ -23,7 +23,7 @@ from baselines.gail.dataset.mujoco_dset import Mujoco_Dset def argsparser(): parser = argparse.ArgumentParser("Tensorflow Implementation of Behavior Cloning") - parser.add_argument('--env_id', help='environment ID', default='Hopper-v1') + parser.add_argument('--env_id', help='environment ID', default='Hopper-v2') parser.add_argument('--seed', help='RNG seed', type=int, default=0) parser.add_argument('--expert_path', type=str, default='data/deterministic.trpo.Hopper.0.00.npz') parser.add_argument('--checkpoint_dir', help='the directory to save model', default='checkpoint') @@ -73,7 +73,7 @@ def learn(env, policy_func, dataset, optim_batch_size=128, max_iters=1e4, savedir_fname = tempfile.TemporaryDirectory().name else: savedir_fname = osp.join(ckpt_dir, task_name) - U.save_state(savedir_fname, var_list=pi.get_variables()) + U.save_variables(savedir_fname, variables=pi.get_variables()) return savedir_fname diff --git a/baselines/gail/run_mujoco.py b/baselines/gail/run_mujoco.py index 379f7f8..e875c5c 100644 --- a/baselines/gail/run_mujoco.py +++ b/baselines/gail/run_mujoco.py @@ -165,7 +165,7 @@ def runner(env, policy_func, load_model_path, timesteps_per_batch, number_trajs, U.initialize() # Prepare for rollouts # ---------------------------------------- - U.load_state(load_model_path) + U.load_variables(load_model_path) obs_list = [] acs_list = []