We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent a5e2e42, commit d93dd9e (Copy full SHA for d93dd9e)
rsl_rl/modules/student_teacher.py
@@ -92,7 +92,8 @@ def entropy(self):
 
     def update_distribution(self, observations):
         mean = self.student(observations)
-        self.distribution = Normal(mean, mean * 0.0 + self.std)
+        std = self.std.expand_as(mean)
+        self.distribution = Normal(mean, std)
 
     def act(self, observations):
         self.update_distribution(observations)
0 commit comments