mirror of
https://github.com/wassname/ray.git
synced 2026-06-30 10:33:24 +08:00
Fix APEX update target (#2300)
* apex hotfix: small hotfix for Apex work
* Also patch the dqn version
This commit is contained in:
committed by
Eric Liang
parent
0b6112b726
commit
739ddfa229
@@ -45,6 +45,6 @@ class ApexDDPGAgent(DDPGAgent):
|
||||
# Ape-X updates based on num steps trained, not sampled
|
||||
if self.optimizer.num_steps_trained - self.last_target_update_ts > \
|
||||
self.config["target_network_update_freq"]:
|
||||
- self.local_evaluator.update_target()
|
||||
+ self.local_evaluator.for_policy(lambda p: p.update_target())
|
||||
self.last_target_update_ts = self.optimizer.num_steps_trained
|
||||
self.num_target_updates += 1
|
||||
|
||||
@@ -56,6 +56,6 @@ class ApexAgent(DQNAgent):
|
||||
# Ape-X updates based on num steps trained, not sampled
|
||||
if self.optimizer.num_steps_trained - self.last_target_update_ts > \
|
||||
self.config["target_network_update_freq"]:
|
||||
- self.local_evaluator.update_target()
|
||||
+ self.local_evaluator.for_policy(lambda p: p.update_target())
|
||||
self.last_target_update_ts = self.optimizer.num_steps_trained
|
||||
self.num_target_updates += 1
|
||||
|
||||
Reference in New Issue
Block a user