Merge pull request #268 from ei-grad/master
Fix fc call in AcerLstmPolicy
This commit is contained in:
@@ -59,9 +59,9 @@ class AcerLstmPolicy(object):
|
|||||||
h5, snew = lstm(xs, ms, S, 'lstm1', nh=nlstm)
|
h5, snew = lstm(xs, ms, S, 'lstm1', nh=nlstm)
|
||||||
h5 = seq_to_batch(h5)
|
h5 = seq_to_batch(h5)
|
||||||
|
|
||||||
pi_logits = fc(h5, 'pi', nact, act=lambda x: x, init_scale=0.01)
|
pi_logits = fc(h5, 'pi', nact, init_scale=0.01)
|
||||||
pi = tf.nn.softmax(pi_logits)
|
pi = tf.nn.softmax(pi_logits)
|
||||||
q = fc(h5, 'q', nact, act=lambda x: x)
|
q = fc(h5, 'q', nact)
|
||||||
|
|
||||||
a = sample(pi_logits) # could change this to use self.pi instead
|
a = sample(pi_logits) # could change this to use self.pi instead
|
||||||
self.initial_state = np.zeros((nenv, nlstm*2), dtype=np.float32)
|
self.initial_state = np.zeros((nenv, nlstm*2), dtype=np.float32)
|
||||||
|
Reference in New Issue
Block a user