Revert "[rllib] Use NoFilter instead of MeanStdFilter for PPO. (#1082)" (#1255)

This reverts commit 971becc905.
This commit is contained in:
Eric Liang
2017-11-26 16:00:46 -08:00
committed by Richard Liaw
parent e583d5a421
commit 7fc2ddbaf7
2 changed files with 2 additions and 2 deletions
+1 -1
View File
@@ -57,7 +57,7 @@ DEFAULT_CONFIG = {
# Config params to pass to the model
"model": {"free_log_std": False},
# Which observation filter to apply to the observation
-"observation_filter": "NoFilter",
+"observation_filter": "MeanStdFilter",
# If >1, adds frameskip
"extra_frameskip": 1,
# Number of timesteps collected in each outer loop
+1 -1
View File
@@ -145,7 +145,7 @@ class Runner(object):
else:
raise Exception("Unknown observation_filter: " +
str(config["observation_filter"]))
-self.reward_filter = NoFilter()
+self.reward_filter = MeanStdFilter((), clip=5.0)
self.sess.run(tf.global_variables_initializer())
def load_data(self, trajectories, full_trace):