Update sac.py: compare boolean flags with `is` instead of `==`

2026-06-27 16:46:28 +08:00 · 2020-02-03 13:48:45 +05:30
parent 73064f31ea
commit 42d2ff08cb
1 changed file with 2 additions and 2 deletions
@@ -27,7 +27,7 @@ class SAC(object):

        if self.policy_type == "Gaussian":
            # Target Entropy = −dim(A) (e.g., -6 for HalfCheetah-v2) as given in the paper
-            if self.automatic_entropy_tuning == True:
+            if self.automatic_entropy_tuning is True:
                self.target_entropy = -torch.prod(torch.Tensor(action_space.shape).to(self.device)).item()
                self.log_alpha = torch.zeros(1, requires_grad=True, device=self.device)
                self.alpha_optim = Adam([self.log_alpha], lr=args.lr)
@@ -43,7 +43,7 @@ class SAC(object):

    def select_action(self, state, eval=False):
        state = torch.FloatTensor(state).to(self.device).unsqueeze(0)
-        if eval == False:
+        if eval is False:
            action, _, _ = self.policy.sample(state)
        else:
            _, _, action = self.policy.sample(state)