We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent cd277d4, commit 596e38c. Copy full SHA for 596e38c
rsl_rl/modules/actor_critic.py
@@ -101,7 +101,8 @@ def entropy(self):
101
102
def update_distribution(self, observations):
103
mean = self.actor(observations)
104
- self.distribution = Normal(mean, mean * 0.0 + self.std)
+ std = self.std.expand_as(mean)
105
+ self.distribution = Normal(mean, std)
106
107
def act(self, observations, **kwargs):
108
self.update_distribution(observations)
0 commit comments