diff --git a/python/ray/rllib/agents/a3c/a3c.py b/python/ray/rllib/agents/a3c/a3c.py index 48432e3df..63310c504 100644 --- a/python/ray/rllib/agents/a3c/a3c.py +++ b/python/ray/rllib/agents/a3c/a3c.py @@ -84,6 +84,6 @@ class A3CAgent(Agent): self.optimizer.step() result = self.optimizer.collect_metrics( self.config["collect_metrics_timeout"]) - result.update( - timesteps_this_iter=self.optimizer.num_steps_sampled - prev_steps) + result.update(timesteps_this_iter=self.optimizer.num_steps_sampled - + prev_steps) return result diff --git a/python/ray/rllib/agents/impala/impala.py b/python/ray/rllib/agents/impala/impala.py index 4a90953e0..c48ea1c58 100644 --- a/python/ray/rllib/agents/impala/impala.py +++ b/python/ray/rllib/agents/impala/impala.py @@ -111,6 +111,6 @@ class ImpalaAgent(Agent): self.optimizer.step() result = self.optimizer.collect_metrics( self.config["collect_metrics_timeout"]) - result.update( - timesteps_this_iter=self.optimizer.num_steps_sampled - prev_steps) + result.update(timesteps_this_iter=self.optimizer.num_steps_sampled - + prev_steps) return result diff --git a/python/ray/rllib/agents/pg/pg.py b/python/ray/rllib/agents/pg/pg.py index 2de0d9e1c..055a8faf4 100644 --- a/python/ray/rllib/agents/pg/pg.py +++ b/python/ray/rllib/agents/pg/pg.py @@ -51,6 +51,6 @@ class PGAgent(Agent): self.optimizer.step() result = self.optimizer.collect_metrics( self.config["collect_metrics_timeout"]) - result.update( - timesteps_this_iter=self.optimizer.num_steps_sampled - prev_steps) + result.update(timesteps_this_iter=self.optimizer.num_steps_sampled - + prev_steps) return result