add defaults
This commit is contained in:
4
baselines/acer/defaults.py
Normal file
4
baselines/acer/defaults.py
Normal file
@@ -0,0 +1,4 @@
|
|||||||
|
def atari():
    """Return the default settings dict for the ``atari`` configuration.

    A fresh dict is built on every call, so callers may mutate the result
    without affecting later calls.
    """
    return {
        'lrschedule': 'constant',
    }
|
22
baselines/ppo2/defaults.py
Normal file
22
baselines/ppo2/defaults.py
Normal file
@@ -0,0 +1,22 @@
|
|||||||
|
def mujoco():
    """Return the default settings dict for the ``mujoco`` configuration.

    All values are plain constants. A fresh dict is built on every call,
    so callers may mutate the result without affecting later calls.
    """
    return {
        'nsteps': 2048,
        'nminibatches': 32,
        'lam': 0.95,
        'gamma': 0.99,
        'noptepochs': 10,
        'log_interval': 1,
        'ent_coef': 0.0,
        'lr': 3e-4,
        'cliprange': 0.2,
        'value_network': 'copy',
    }
|
||||||
|
|
||||||
|
def atari():
    """Return the default settings dict for the ``atari`` configuration.

    ``lr`` and ``cliprange`` are callables rather than constants: each
    takes a single number ``f`` and returns ``f`` multiplied by a fixed
    base value (2.5e-4 and 0.1 respectively).
    NOTE(review): ``f`` is presumably a training-progress fraction
    supplied by the caller -- confirm against the code that consumes them.

    A fresh dict (with fresh lambdas) is built on every call.
    """
    return {
        'nsteps': 128,
        'nminibatches': 4,
        'lam': 0.95,
        'gamma': 0.99,
        'noptepochs': 4,
        'log_interval': 1,
        'ent_coef': 0.01,
        'lr': lambda f: f * 2.5e-4,
        'cliprange': lambda f: f * 0.1,
    }
|
30
baselines/trpo_mpi/defaults.py
Normal file
30
baselines/trpo_mpi/defaults.py
Normal file
@@ -0,0 +1,30 @@
|
|||||||
|
from rl_common.models import mlp, cnn_small
|
||||||
|
|
||||||
|
|
||||||
|
def atari():
    """Return the default settings dict for the ``atari`` configuration.

    The ``network`` entry is the result of calling ``cnn_small()`` (imported
    at module level); it is evaluated anew on every call. All other entries
    are plain numeric constants.
    """
    return {
        'network': cnn_small(),
        'timesteps_per_batch': 512,
        'max_kl': 0.001,
        'cg_iters': 10,
        'cg_damping': 1e-3,
        'gamma': 0.98,
        'lam': 1.0,
        'vf_iters': 3,
        'vf_stepsize': 1e-4,
        'entcoeff': 0.00,
    }
|
||||||
|
|
||||||
|
def mujoco():
    """Return the default settings dict for the ``mujoco`` configuration.

    The ``network`` entry is the result of calling
    ``mlp(num_hidden=32, num_layers=2)`` (imported at module level); it is
    evaluated anew on every call. The remaining entries are plain constants.
    """
    return {
        'network': mlp(num_hidden=32, num_layers=2),
        'timesteps_per_batch': 1024,
        'max_kl': 0.01,
        'cg_iters': 10,
        'cg_damping': 0.1,
        'gamma': 0.99,
        'lam': 0.98,
        'vf_iters': 5,
        'vf_stepsize': 1e-3,
        'normalize_observations': True,
    }
|
Reference in New Issue
Block a user