Compare commits

..

8 Commits

Author SHA1 Message Date
Peter Zhokhov
d1021f5885 Merge branch 'master' of https://github.com/openai/baselines into peterz_import_internal 2018-06-07 14:00:58 -07:00
Peter Zhokhov
6fd15ec92d adding missing tile_images.py 2018-06-07 13:59:58 -07:00
Peter Zhokhov
fab274b9af import internal 2018-06-06 10:34:05 -07:00
Peter Zhokhov
0392dda802 Merge branch 'master' of https://github.com/openai/baselines into peterz_import_internal 2018-06-06 10:33:45 -07:00
Peter Zhokhov
4dc709faae proper rng seeding in the test_identity 2018-05-21 14:46:49 -07:00
Peter Zhokhov
ea55240732 exported commit with identity test 2018-05-21 13:05:39 -07:00
Peter Zhokhov
3d7ed16f1f extra import of the baselines badge 2018-05-16 12:05:35 -07:00
Peter Zhokhov
efb071949e import rl-algs from 2e3a166 commit 2018-05-16 12:00:23 -07:00

View File

@@ -47,12 +47,18 @@ class Mujoco_Dset(object):
obs = traj_data['obs'][:traj_limitation]
acs = traj_data['acs'][:traj_limitation]
# obs, acs: shape (N, L, ) + S where N = # episodes, L = episode length
# and S is the environment observation/action space.
# Flatten to (N * L, prod(S))
self.obs = np.reshape(obs, [-1, np.prod(obs.shape[2:])])
self.acs = np.reshape(acs, [-1, np.prod(acs.shape[2:])])
def flatten(x):
    """Stack per-episode arrays into one 2-D array of steps.

    Args:
        x: sequence of episodes, i.e. shape (E,) holding one array per
            episode (episodes may differ in length) or a dense array of
            shape (E, L) + S. Each episode has shape (L_i,) + S.

    Returns:
        A float64 array of shape (sum(L_i), prod(S)) with the episodes
        laid out one after another in their original order.
    """
    episodes = []
    for episode in x:
        episode = np.asarray(episode)
        # Collapse the per-step shape S into a single feature axis so that
        # scalar steps (L,) and multi-dimensional steps (L, H, W, ...) are
        # accepted as well as the plain (L, D) case. The width is computed
        # explicitly rather than with -1, which numpy cannot infer for a
        # zero-length episode.
        width = int(np.prod(episode.shape[1:]))
        episodes.append(episode.reshape(len(episode), width))

    size = episodes[0].shape[1]
    episode_lengths = [len(episode) for episode in episodes]
    # np.zeros defaults to float64; values are cast on assignment.
    y = np.zeros((sum(episode_lengths), size))
    start_idx = 0
    for length, episode in zip(episode_lengths, episodes):
        y[start_idx:start_idx + length] = episode
        start_idx += length
    return y
self.obs = np.array(flatten(obs))
self.acs = np.array(flatten(acs))
self.rets = traj_data['ep_rets'][:traj_limitation]
self.avg_ret = sum(self.rets)/len(self.rets)
self.std_ret = np.std(np.array(self.rets))