diff --git a/python/ray/rllib/ppo/runner.py b/python/ray/rllib/ppo/runner.py index 47c89eccb..46b738ae5 100644 --- a/python/ray/rllib/ppo/runner.py +++ b/python/ray/rllib/ppo/runner.py @@ -155,7 +155,7 @@ class Runner(object): [trajectories["observations"], trajectories["value_targets"] if use_gae else dummy, trajectories["advantages"], - trajectories["actions"].squeeze(), + trajectories["actions"], trajectories["logprobs"], trajectories["vf_preds"] if use_gae else dummy], full_trace=full_trace)