fix incorrect critic loss in TD3 (#10775)

Co-authored-by: Manny Vindiola <manuel.m.vindiola.civ@mail.mil>
This commit is contained in:
mvindiola1
2020-09-20 23:01:51 -04:00
committed by GitHub
parent 3e94c690c7
commit 2b893d1bb5
3 changed files with 0 additions and 3 deletions
-1
View File
@@ -175,7 +175,6 @@ def ddpg_actor_critic_loss(policy, model, _, train_batch):
if twin_q:
td_error = q_t_selected - q_t_selected_target
twin_td_error = twin_q_t_selected - q_t_selected_target
-td_error = td_error + twin_td_error
if use_huber:
errors = huber_loss(td_error, huber_threshold) + \
huber_loss(twin_td_error, huber_threshold)
-1
View File
@@ -124,7 +124,6 @@ def ddpg_actor_critic_loss(policy, model, _, train_batch):
if twin_q:
td_error = q_t_selected - q_t_selected_target
twin_td_error = twin_q_t_selected - q_t_selected_target
-td_error = td_error + twin_td_error
if use_huber:
errors = huber_loss(td_error, huber_threshold) \
+ huber_loss(twin_td_error, huber_threshold)
-1
View File
@@ -495,7 +495,6 @@ class TestDDPG(unittest.TestCase):
td_error = q_t_selected - q_t_selected_target
twin_td_error = twin_q_t_selected - q_t_selected_target
-td_error = td_error + twin_td_error
errors = huber_loss(td_error, huber_threshold) + \
huber_loss(twin_td_error, huber_threshold)