diff --git a/python/ray/rllib/policy/tf_policy.py b/python/ray/rllib/policy/tf_policy.py index ed234f809..ef0de42e2 100644 --- a/python/ray/rllib/policy/tf_policy.py +++ b/python/ray/rllib/policy/tf_policy.py @@ -205,7 +205,7 @@ class TFPolicy(Policy): self._grads_and_vars) if log_once("loss_used"): - logger.info( + logger.debug( "These tensors were used in the loss_fn:\n\n{}\n".format( summarize(self._loss_input_dict))) diff --git a/python/ray/rllib/tuned_examples/halfcheetah-ddpg.yaml b/python/ray/rllib/tuned_examples/halfcheetah-ddpg.yaml index 6a4bd52e7..0513f7bf6 100644 --- a/python/ray/rllib/tuned_examples/halfcheetah-ddpg.yaml +++ b/python/ray/rllib/tuned_examples/halfcheetah-ddpg.yaml @@ -47,7 +47,6 @@ halfcheetah-ddpg: # === Parallelism === num_workers: 0 num_gpus_per_worker: 0 - optimizer_class: "SyncReplayOptimizer" per_worker_exploration: False worker_side_prioritization: False diff --git a/python/ray/rllib/tuned_examples/mountaincarcontinuous-ddpg.yaml b/python/ray/rllib/tuned_examples/mountaincarcontinuous-ddpg.yaml index 3a8f61229..87ce8eff5 100644 --- a/python/ray/rllib/tuned_examples/mountaincarcontinuous-ddpg.yaml +++ b/python/ray/rllib/tuned_examples/mountaincarcontinuous-ddpg.yaml @@ -47,7 +47,6 @@ mountaincarcontinuous-ddpg: # === Parallelism === num_workers: 0 num_gpus_per_worker: 0 - optimizer_class: "SyncReplayOptimizer" per_worker_exploration: False worker_side_prioritization: False diff --git a/python/ray/rllib/tuned_examples/pendulum-ddpg.yaml b/python/ray/rllib/tuned_examples/pendulum-ddpg.yaml index 59891a86b..a2ad295fb 100644 --- a/python/ray/rllib/tuned_examples/pendulum-ddpg.yaml +++ b/python/ray/rllib/tuned_examples/pendulum-ddpg.yaml @@ -47,7 +47,6 @@ pendulum-ddpg: # === Parallelism === num_workers: 0 num_gpus_per_worker: 0 - optimizer_class: "SyncReplayOptimizer" per_worker_exploration: False worker_side_prioritization: False