Fixed inconsistent action placeholder (#5213)

2026-07-03 01:43:14 +08:00 · 2019-07-18 01:55:14 +08:00
parent 214f09d969
commit ae03c42dd6
1 changed file with 1 addition and 1 deletion
@@ -110,7 +110,7 @@ class MARWILPolicy(MARWILPostprocessing, TFPolicy):
        self.output_actions = action_dist.sample()

        # Training inputs
-        self.act_t = tf.placeholder(tf.int32, [None], name="action")
+        self.act_t = ModelCatalog.get_action_placeholder(action_space)
        self.cum_rew_t = tf.placeholder(tf.float32, [None], name="reward")

        # v network evaluation