mirror of
https://github.com/wassname/ray.git
synced 2026-06-30 18:51:39 +08:00
[rllib] Support 1-dimensional action spaces (PPO) (#1347)
* Small fix for supporting custom preprocessors
* PEP8
* Remove squeeze from actions
This commit is contained in:
@@ -155,7 +155,7 @@ class Runner(object):
|
||||
[trajectories["observations"],
|
||||
trajectories["value_targets"] if use_gae else dummy,
|
||||
trajectories["advantages"],
|
||||
- trajectories["actions"].squeeze(),
|
||||
+ trajectories["actions"],
|
||||
trajectories["logprobs"],
|
||||
trajectories["vf_preds"] if use_gae else dummy],
|
||||
full_trace=full_trace)
|
||||
|
||||
Reference in New Issue
Block a user