mirror of
https://github.com/Farama-Foundation/Gymnasium.git
synced 2025-08-27 00:37:19 +00:00
35 lines
1.3 KiB
Python
35 lines
1.3 KiB
Python
![]() |
import time
|
||
|
from collections import deque
|
||
|
|
||
|
import gym
|
||
|
|
||
|
|
||
|
class RecordEpisodeStatistics(gym.Wrapper):
|
||
|
def __init__(self, env, deque_size=100):
|
||
|
super(RecordEpisodeStatistics, self).__init__(env)
|
||
|
self.t0 = time.time() # TODO: use perf_counter when gym removes Python 2 support
|
||
|
self.episode_return = 0.0
|
||
|
self.episode_length = 0
|
||
|
self.return_queue = deque(maxlen=deque_size)
|
||
|
self.length_queue = deque(maxlen=deque_size)
|
||
|
|
||
|
def reset(self, **kwargs):
|
||
|
observation = super(RecordEpisodeStatistics, self).reset(**kwargs)
|
||
|
self.episode_return = 0.0
|
||
|
self.episode_length = 0
|
||
|
return observation
|
||
|
|
||
|
def step(self, action):
|
||
|
observation, reward, done, info = super(RecordEpisodeStatistics, self).step(action)
|
||
|
self.episode_return += reward
|
||
|
self.episode_length += 1
|
||
|
if done:
|
||
|
info['episode'] = {'r': self.episode_return,
|
||
|
'l': self.episode_length,
|
||
|
't': round(time.time() - self.t0, 6)}
|
||
|
self.return_queue.append(self.episode_return)
|
||
|
self.length_queue.append(self.episode_length)
|
||
|
self.episode_return = 0.0
|
||
|
self.episode_length = 0
|
||
|
return observation, reward, done, info
|