diff --git a/baselines/ppo2/model.py b/baselines/ppo2/model.py index 3d5378a..af67999 100644 --- a/baselines/ppo2/model.py +++ b/baselines/ppo2/model.py @@ -137,7 +137,7 @@ class Model(object): if MPI is not None: sync_from_root(sess, global_variables) # pylint: disable=E1101 - def step_as_dict(self, **kwargs): + def step_with_dict(self, **kwargs): return self.act_model.step(**kwargs) def step(self, obs, M=None, S=None, **kwargs): diff --git a/baselines/ppo2/runner.py b/baselines/ppo2/runner.py index 1917dba..071de3a 100644 --- a/baselines/ppo2/runner.py +++ b/baselines/ppo2/runner.py @@ -49,7 +49,7 @@ class Runner(AbstractEnvRunner): transitions['dones'] = self.dones if 'next_states' in prev_transition: transitions['states'] = prev_transition['next_states'] - transitions.update(self.model.step_as_dict(**transitions)) + transitions.update(self.model.step_with_dict(**transitions)) # Take actions in env and look the results # Infos contains a ton of useful informations @@ -80,7 +80,7 @@ class Runner(AbstractEnvRunner): dtype = data_type[key] if key in data_type else np.float minibatch[key] = np.asarray(minibatch[key], dtype=dtype) - last_values = self.model.step_as_dict(**transitions)['values'] + last_values = self.model.step_with_dict(**transitions)['values'] # Calculate returns and advantages. minibatch['advs'], minibatch['returns'] = \