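Remove the loops that toggle `requires_grad` on the critic parameters around the policy update. (Original message: "I have no idea what I'm doing.")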

This commit is contained in:
pranz24
2020-06-06 22:56:10 +05:30
parent e5c349f0b0
commit ec004304a9
-6
View File
@@ -73,9 +73,6 @@ class SAC(object):
qf_loss.backward()
self.critic_optim.step()
for c_param in self.critic.parameters():
c_param.requires_grad = False
pi, log_pi, _ = self.policy.sample(state_batch)
qf1_pi, qf2_pi = self.critic(state_batch, pi)
@@ -87,9 +84,6 @@ class SAC(object):
policy_loss.backward()
self.policy_optim.step()
for c_param in self.critic.parameters():
c_param.requires_grad = True
if self.automatic_entropy_tuning:
alpha_loss = -(self.log_alpha * (log_pi + self.target_entropy).detach()).mean()