mirror of
https://github.com/wassname/pytorch-soft-actor-critic.git
synced 2026-06-27 16:46:28 +08:00
small fix
This commit is contained in:
@@ -102,7 +102,8 @@ class GaussianPolicy(nn.Module):
|
||||
# Enforcing Action Bound
|
||||
log_prob -= torch.log(self.action_scale * (1 - y_t.pow(2)) + epsilon)
|
||||
log_prob = log_prob.sum(1, keepdim=True)
|
||||
- return action, log_prob, torch.tanh(mean)
|
||||
+ mean = torch.tanh(mean) * self.action_scale + self.action_bias
|
||||
+ return action, log_prob, mean
|
||||
|
||||
def to(self, device):
|
||||
self.action_scale = self.action_scale.to(device)
|
||||
|
||||
Reference in New Issue
Block a user