update pre-commit (#344)

This commit is contained in:
Mark Towers
2023-02-22 15:41:40 +00:00
committed by GitHub
parent a7d9146b1d
commit f9b81acf12
32 changed files with 47 additions and 59 deletions

View File

@@ -419,7 +419,6 @@ entropies = []
# use tqdm to get a progress bar for training
for sample_phase in tqdm(range(n_updates)):
# we don't have to reset the envs, they just continue playing
# until the episode is over and then reset automatically
@@ -435,7 +434,6 @@ for sample_phase in tqdm(range(n_updates)):
# play n steps in our parallel environments to collect data
for step in range(n_steps_per_update):
# select an action A_{t} using S_{t} as input for the agent
actions, action_log_probs, state_value_preds, entropy = agent.select_action(
states
@@ -674,7 +672,6 @@ for episode in range(n_showcase_episodes):
# play one episode
done = False
while not done:
# select an action A_{t} using S_{t} as input for the agent
with torch.no_grad():
action, _, _, _ = agent.select_action(state[None, :])