[rllib] Support 1-dimensional action spaces (PPO) (#1347)

* Small fix for supporting custom preprocessors

* PEP8

* Remove squeeze from actions
This commit is contained in:
Cathy Wu
2017-12-19 14:17:06 -08:00
committed by Philipp Moritz
parent 6724f57b03
commit 772527caa4
+1 -1
View File
@@ -155,7 +155,7 @@ class Runner(object):
[trajectories["observations"],
trajectories["value_targets"] if use_gae else dummy,
trajectories["advantages"],
-trajectories["actions"].squeeze(),
+trajectories["actions"],
trajectories["logprobs"],
trajectories["vf_preds"] if use_gae else dummy],
full_trace=full_trace)