From 7cadef715facc8b0996735060015bb42e66540a7 Mon Sep 17 00:00:00 2001 From: Timo Kaufmann Date: Tue, 6 Aug 2019 01:02:21 +0200 Subject: [PATCH] Fix typo (#930) * Fix typo * Fix train_freq documentation Seems to be a copy-paste error, train_freq has nothing to do with printing. * Fix documentation typo --- baselines/deepq/build_graph.py | 2 +- baselines/deepq/deepq.py | 3 +-- 2 files changed, 2 insertions(+), 3 deletions(-) diff --git a/baselines/deepq/build_graph.py b/baselines/deepq/build_graph.py index 650449c..f7de316 100644 --- a/baselines/deepq/build_graph.py +++ b/baselines/deepq/build_graph.py @@ -13,7 +13,7 @@ The functions in this file can are used to create the following functions: stochastic: bool if set to False all the actions are always deterministic (default False) update_eps_ph: float - update epsilon a new value, if negative not update happens + update epsilon a new value, if negative no update happens (default: no update) Returns diff --git a/baselines/deepq/deepq.py b/baselines/deepq/deepq.py index b7b9d1a..14dfd19 100644 --- a/baselines/deepq/deepq.py +++ b/baselines/deepq/deepq.py @@ -142,9 +142,8 @@ def learn(env, final value of random action probability train_freq: int update the model every `train_freq` steps. - set to None to disable printing batch_size: int - size of a batched sampled from replay buffer for training + size of a batch sampled from replay buffer for training print_freq: int how often to print out training progress set to None to disable printing