changed default ppo2 lr schedule to linear RUN BENCHMARKS
This commit is contained in:
@@ -1 +1 @@
|
|||||||
ppo2_mpi
|
ppo2
|
||||||
|
@@ -7,7 +7,7 @@ def mujoco():
|
|||||||
noptepochs=10,
|
noptepochs=10,
|
||||||
log_interval=1,
|
log_interval=1,
|
||||||
ent_coef=0.0,
|
ent_coef=0.0,
|
||||||
lr=3e-4,
|
lr=lambda f: 3e-4 * f,
|
||||||
cliprange=0.2,
|
cliprange=0.2,
|
||||||
value_network='copy'
|
value_network='copy'
|
||||||
)
|
)
|
||||||
|
Reference in New Issue
Block a user