From ae03c42dd6cd9c493814f149abff0324fadca190 Mon Sep 17 00:00:00 2001 From: Jones Wong Date: Thu, 18 Jul 2019 01:55:14 +0800 Subject: [PATCH] Fixed inconsistent action placeholder (#5213) --- python/ray/rllib/agents/marwil/marwil_policy.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/python/ray/rllib/agents/marwil/marwil_policy.py b/python/ray/rllib/agents/marwil/marwil_policy.py index 8c8eafba3..47ff12ebd 100644 --- a/python/ray/rllib/agents/marwil/marwil_policy.py +++ b/python/ray/rllib/agents/marwil/marwil_policy.py @@ -110,7 +110,7 @@ class MARWILPolicy(MARWILPostprocessing, TFPolicy): self.output_actions = action_dist.sample() # Training inputs - self.act_t = tf.placeholder(tf.int32, [None], name="action") + self.act_t = ModelCatalog.get_action_placeholder(action_space) self.cum_rew_t = tf.placeholder(tf.float32, [None], name="reward") # v network evaluation