small fix: rescale the returned tanh(mean) by action_scale and action_bias

This commit is contained in:
pranz24
2019-09-10 22:29:35 +05:30
parent 6b6f64db37
commit c2d50837db
+2 -1
View File
@@ -102,7 +102,8 @@ class GaussianPolicy(nn.Module):
# Enforcing Action Bound
log_prob -= torch.log(self.action_scale * (1 - y_t.pow(2)) + epsilon)
log_prob = log_prob.sum(1, keepdim=True)
-return action, log_prob, torch.tanh(mean)
+mean = torch.tanh(mean) * self.action_scale + self.action_bias
+return action, log_prob, mean
def to(self, device):
self.action_scale = self.action_scale.to(device)