Fix behavior cloning due to API changes (#1014)
This commit is contained in:
@@ -23,7 +23,7 @@ from baselines.gail.dataset.mujoco_dset import Mujoco_Dset
|
||||
|
||||
def argsparser():
|
||||
parser = argparse.ArgumentParser("Tensorflow Implementation of Behavior Cloning")
|
||||
parser.add_argument('--env_id', help='environment ID', default='Hopper-v1')
|
||||
parser.add_argument('--env_id', help='environment ID', default='Hopper-v2')
|
||||
parser.add_argument('--seed', help='RNG seed', type=int, default=0)
|
||||
parser.add_argument('--expert_path', type=str, default='data/deterministic.trpo.Hopper.0.00.npz')
|
||||
parser.add_argument('--checkpoint_dir', help='the directory to save model', default='checkpoint')
|
||||
@@ -73,7 +73,7 @@ def learn(env, policy_func, dataset, optim_batch_size=128, max_iters=1e4,
|
||||
savedir_fname = tempfile.TemporaryDirectory().name
|
||||
else:
|
||||
savedir_fname = osp.join(ckpt_dir, task_name)
|
||||
U.save_state(savedir_fname, var_list=pi.get_variables())
|
||||
U.save_variables(savedir_fname, variables=pi.get_variables())
|
||||
return savedir_fname
|
||||
|
||||
|
||||
|
@@ -165,7 +165,7 @@ def runner(env, policy_func, load_model_path, timesteps_per_batch, number_trajs,
|
||||
U.initialize()
|
||||
# Prepare for rollouts
|
||||
# ----------------------------------------
|
||||
U.load_state(load_model_path)
|
||||
U.load_variables(load_model_path)
|
||||
|
||||
obs_list = []
|
||||
acs_list = []
|
||||
|
Reference in New Issue
Block a user