mirror of
https://github.com/wassname/ray.git
synced 2026-06-27 21:38:18 +08:00
Use observation filter in compute_action for PPO. (#884)
This commit is contained in:
committed by
Philipp Moritz
parent
5d72818ddc
commit
60d4d01d06
@@ -266,4 +266,5 @@ class PolicyGradient(Algorithm):
                 for (a, o) in zip(self.agents, extra_data[4])])
 
     def compute_action(self, observation):
+        observation = self.model.observation_filter(observation)
         return self.model.common_policy.compute([observation])[0][0]
Reference in New Issue
Block a user