Fix APEX update target (#2300)

* apex hotfix

small hotfix for Apex work

* Also patch the dqn version
This commit is contained in:
Sergey Kolesnikov
2018-06-25 23:05:27 +03:00
committed by Eric Liang
parent 0b6112b726
commit 739ddfa229
2 changed files with 2 additions and 2 deletions
+1 -1
View File
@@ -45,6 +45,6 @@ class ApexDDPGAgent(DDPGAgent):
# Ape-X updates based on num steps trained, not sampled
if self.optimizer.num_steps_trained - self.last_target_update_ts > \
self.config["target_network_update_freq"]:
-self.local_evaluator.update_target()
+self.local_evaluator.for_policy(lambda p: p.update_target())
self.last_target_update_ts = self.optimizer.num_steps_trained
self.num_target_updates += 1
+1 -1
View File
@@ -56,6 +56,6 @@ class ApexAgent(DQNAgent):
# Ape-X updates based on num steps trained, not sampled
if self.optimizer.num_steps_trained - self.last_target_update_ts > \
self.config["target_network_update_freq"]:
-self.local_evaluator.update_target()
+self.local_evaluator.for_policy(lambda p: p.update_target())
self.last_target_update_ts = self.optimizer.num_steps_trained
self.num_target_updates += 1